Read in the data
#data<- read.table(file.choose(),sep="\t",header=T)
##first set path to /group/bprice5
### Image of how to
dat<- read.csv("/group/bprice5/1314C-08.CSV",header=T)
head(dat)
## PIDM FILE.CREATION.DATE TERM.CODE AID.YEAR PERM.CITY PERM.STATE
## 1 2266315 20160728 201308 1314 Morgantown WV
## 2 2266316 20160728 201308 1314 Bethel Park PA
## 3 2266341 20160728 201308 1314 Houston TX
## 4 2266366 20160728 201308 1314 Pittsburgh PA
## 5 2266371 20160728 201308 1314 Fairmont WV
## 6 2266376 20160728 201308 1314 Frederick MD
## PERM.ZIP.CODE PERM.CNTY.CODE X_ PERM.NATN.CODE
## 1 26505-3904 54061 Monongalia, WV 2455
## 2 15102-1368 42003 Allegheny, PA NA
## 3 77042 39015 Brown, OH NA
## 4 15241-3246 42003 Allegheny, PA NA
## 5 26554-2217 54049 Marion, WV NA
## 6 21701-4472 24021 Frederick, MD NA
## PERM.NATN.DESC PERM.PHONE..NULLED. MAIL.ADDR.LINE.1..NULLED.
## 1 Saudi Arabia NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## MAIL.ADDR.LINE.2..NULLED. MAIL.ADDR.LINE.3..NULLED. MAIL.CITY
## 1 NA NA Morgantown
## 2 NA NA Bethel Park
## 3 NA NA Morgantown
## 4 NA NA Pittsburgh
## 5 NA NA Fairmont
## 6 NA NA Frederick
## MAIL.STATE MAIL.ZIP.CODE MAIL.CNTY.CODE MAIL.CNTY.DESC MAIL.NATN.CODE
## 1 WV 26505-3904 54061 Monongalia, WV NA
## 2 PA 15102-1368 42003 Allegheny, PA NA
## 3 WV 26505-2558 54061 Monongalia, WV NA
## 4 PA 15241-3246 42003 Allegheny, PA NA
## 5 WV 26554-2217 54049 Marion, WV NA
## 6 MD 21701-4472 24021 Frederick, MD NA
## MAIL.NATN.DESC MAIL.PHONE..NULLED. ADM.ADDR.STATE.CODE ADM.ADDR.ZIP.CODE
## 1 NA WV 26508-9247
## 2 NA PA 15102-1368
## 3 NA TX 77042
## 4 NA PA 15241-3246
## 5 NA WV 26554-2217
## 6 NA MD 21701-4472
## ADM.CNTY.CODE ETHNIC.CODE ETHNIC.DESC BIRTH.DATE LEGACY
## 1 54061 4 Asian/Pacific Islander 26-Dec-84
## 2 42003 6 Race/Ethnicity Unknown 4-Jan-94 P
## 3 39015 1 White Caucasian 25-May-90
## 4 42003 1 White Caucasian 1-Aug-93 H
## 5 54049 6 Race/Ethnicity Unknown 25-Jun-77
## 6 24021 6 Race/Ethnicity Unknown 26-Nov-94 B
## LEGACY.DESC SEX.CODE CONFID.IND DEAD.IND DEAD.DATE
## 1 F N
## 2 Father and Mother are Alumni F N
## 3 M N
## 4 Husband is Alumnus M N
## 5 M N
## 6 Brother M N
## CITIZENSHIP.CODE STUDENTS.MAIN.PIN..NULLED. TERM.PIN..NULLED.
## 1 4 NA NA
## 2 1 NA NA
## 3 4 NA NA
## 4 1 NA NA
## 5 1 NA NA
## 6 1 NA NA
## VISA.TYPE.CODE.CURRENT LEGAL.NATION.CODE LEGAL.NATION.DESCR
## 1 F1 2455 Saudi Arabia
## 2 NA
## 3 F1 2455 Saudi Arabia
## 4 NA
## 5 NA
## 6 NA
## GS.ORIGL.TERM.OF.ENTRY.AT.WVU GS.TERM.CODE.EFFECTIVE GS.STATUS.CODE
## 1 201105 201308 AS
## 2 201208 201305 AS
## 3 201108 201305 AS
## 4 201208 201308 AS
## 5 201205 201308 AS
## 6 201208 201305 AS
## GS.TERM.CODE.ADMIT GS.ADMIT.TYPE.CODE GS.ADMIT.TYPE.DESC
## 1 201308 7 Masters
## 2 201208 1 First Time Freshman
## 3 201108 4 Transfer
## 4 201208 1 First Time Freshman
## 5 201205 1 First Time Freshman
## 6 201301 4 Transfer
## STUDENT.CODE.STATUS..FTF..FTT..FTG..FTP. GS.STUDENT.TYPE.CODE
## 1 FTG A
## 2 B
## 3 B
## 4 B
## 5 B
## 6 B
## GS.LEVEL.CODE GS.EXPECTED.GRAD..DATE UNUSED.NULLED. GS.SITE.CODE
## 1 GR 20160531 NA
## 2 UG 20180531 NA
## 3 UG 20150531 NA
## 4 UG 20170531 NA
## 5 UG 20150531 NA
## 6 UG 20180531 NA
## GS.RESIDENCY GS.COLLEGE.CODE GS.COLLEGE.DESC
## 1 N 14 Arts and Sciences
## 2 N 49 Reed College of Media
## 3 N 30 Engineering Mineral Resources
## 4 N 30 Engineering Mineral Resources
## 5 R 41 University College
## 6 N 30 Engineering Mineral Resources
## GS.DEGREE.CODE GS.DEGREE.DESC GS.MAJOR.CODE.1
## 1 MPS Master of Professional Studies 1478
## 2 BSJ BS in Journalism 4930
## 3 BSCHE BS in Chemical Engineering 3010
## 4 BSPNGE BS in Petroleum & Natl Gas Eng 3075
## 5 BA Bachelor of Arts 4132
## 6 BS Bachelor of Science 3049
## GS.MAJOR.CODE.1.DESC GS.MAJOR.CODE.2 GS.MAJOR.CODE.2.DESC
## 1 Applied Statistics
## 2 Direct Admit Journalism Prg
## 3 Chemical Engineering
## 4 Petroleum & Natural Gas Engr
## 5 Regents Bachelor of Arts
## 6 General Engineering
## GS.CLASSIFICATION..RANK. GS.ATTRIBUTE ACADEMIC.COMMON.MARKET
## 1 GR
## 2 SO ACM
## 3 SR ARO
## 4 SO
## 5 SR
## 6 SO
## ACADEMIC.COMMON.MARKET.DESC HIGH.SCHOOL.CODE
## 1 490075
## 2 Active/Academic Common Market 392270
## 3 Active/Reciprocity Ohio 363535
## 4 393707
## 5 491275
## 6 210535
## HIGH.SCHOOL.NAME HIGH.SCHOOL.STATE.CODE
## 1 Woodrow Wilson High School WV
## 2 Bethel Park Sr High School PA
## 3 Western Brown High School OH
## 4 Upper Saint Clair High School PA
## 5 Tucker County High School WV
## 6 Governor Thomas Johnson High MD
## HIGH.SCHOOL.ZIP.CODE WEIGHTED.GPA.IND HIGH.SCHOOL.GPA
## 1 25801-3158 NA
## 2 15102-1607 W 3.35
## 3 45154-0386 NW 2.79
## 4 15241-2331 W 3.45
## 5 26269-9302 NW 2.63
## 6 21701-4430 W 3.11
## HIGH.SCHOOL.GRAD..DATE PREVIOUS.COLL.CODE PREVIOUS.COLL.NAME
## 1 19880601 I03099 Al Jouf University
## 2 20120601 5904 West Virginia University
## 3 20110527 6827 Texas Tech University
## 4 20120601 5904 West Virginia University
## 5 19950604 0000AF Service in the Armed Forces
## 6 20120501 5230 Frederick Community College
## PREVIOUS.COLL.GPA ACT.DATE..FROM.HIGHEST.A05.
## 1 2.66
## 2 NA
## 3 3.16 1-Apr-10
## 4 4.00 1-Jun-11
## 5 3.65
## 6 4.00 1-Oct-11
## ACT.COMP.SCORE..HIGHEST.A05. ACT.ENGL..FROM.HIGHEST.A05.
## 1 NA NA
## 2 NA NA
## 3 21 21
## 4 26 26
## 5 NA NA
## 6 24 23
## ACT.MATH..FROM.HIGHEST.A05. ACT.READ..FROM.HIGHEST.A05.
## 1 NA NA
## 2 NA NA
## 3 17 22
## 4 27 22
## 5 NA NA
## 6 26 23
## ACT.SCI.REASON..FROM.HIGHEST.A05.
## 1 NA
## 2 NA
## 3 24
## 4 27
## 5 NA
## 6 24
## ACT.SUM.OF.STANDARD.SCORES..FROM.HIGHEST.A05.
## 1 NA
## 2 NA
## 3 84
## 4 120
## 5 NA
## 6 96
## SAT.RE.CENTERED.IND..FROM.HIGHEST.SMV. SAT.DATE..FROM.HIGHEST.SMV.
## 1
## 2 R 1-May-11
## 3 R 1-Mar-09
## 4 R 1-May-11
## 5 R 1-Nov-10
## 6
## SAT.TOTAL..HIGHEST.SMV. SAT.MATH..FROM.HIGHEST.SMV.
## 1 NA NA
## 2 1050 520
## 3 1030 660
## 4 1180 630
## 5 1070 590
## 6 NA NA
## SAT.VERBAL..FROM.HIGHEST.SMV. HIGHEST.ACT.ENGL HIGHEST.ACT.MATH
## 1 NA NA NA
## 2 530 NA NA
## 3 370 21 17
## 4 550 26 27
## 5 480 NA NA
## 6 NA 23 26
## HIGHEST.ACT.READING HIGHEST.ACT.SCI.REASON
## 1 NA NA
## 2 NA NA
## 3 24 24
## 4 22 27
## 5 NA NA
## 6 23 24
## HIGHEST.ACT.SUM.OF.STANDARD.SCORES HIGHEST.SAT.VERBAL HIGHEST.SAT.MATH
## 1 NA NA NA
## 2 NA 530 520
## 3 84 370 660
## 4 120 550 640
## 5 NA 490 590
## 6 96 NA NA
## GRE.VERBAL..MAX. GRE.QUANT..MAX. GRE.ANALYTIC..MAX. GRE.WRITING.ASSESS
## 1 520 600 600 NA
## 2 NA NA NA NA
## 3 NA NA NA NA
## 4 NA NA NA NA
## 5 380 400 410 NA
## 6 NA NA NA NA
## GRE.CHEM.TOTAL GRE.COMP.SCI.TOTAL GRE.ENGR.TOTAL GRE.MATH.TOTAL
## 1 NA NA NA NA
## 2 NA NA NA NA
## 3 NA NA NA NA
## 4 NA NA NA NA
## 5 NA NA NA NA
## 6 NA NA NA NA
## HRS.REG.FOR.SPRING.TERM..RE.RR.RW. HRS.REG.FOR.SUMMER.I.TERM..RE.RR.RW.
## 1 9 3
## 2 13 NA
## 3 8 10
## 4 14 4
## 5 6 6
## 6 19 6
## HRS.REG.FOR.SUMMER.II.TERM..RE.RR.RW. HRS.REG.FOR.FALL.TERM..RE.RR.RW.
## 1 NA 9
## 2 NA 18
## 3 NA 13
## 4 NA 14
## 5 NA 6
## 6 NA 15
## HRS.REG.FOR.EXTRA.TERM..RE.RR.RW. SPORTS.CODE SPORTS.DESC HONORS.CODE
## 1 NA
## 2 NA
## 3 NA
## 4 NA HONORS-SO DEAN
## 5 NA
## 6 NA
## SCHOLARS.CODE SENIOR.CITZ.CODE..SERIES.67. EXCHANGE.STUDENT.CODE
## 1 NA
## 2 NA
## 3 NA
## 4 NA
## 5 NA
## 6 NA
## WEEBLES.CODE SSS.TRIO.CODE UNUSED.CODE.G UNUSED.CODE.H PROMISE.CODE
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA PROMISE
## 5 NA NA PROMISE
## 6 NA NA PROMISE
## UNUSED.CODE.J VETERAN.CODE VETERAN.DESC BOT.INSTIT..NULLED.
## 1 NA
## 2 NA
## 3 NA
## 4 NA
## 5 I 33 NA
## 6 NA
## BOT.YR.OF.REPORT..NULLED. BOT.LEVL.CODE..NULLED.
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## FILLER..WAS.SCHOOL.BUDGET. UNMET.NEED FED.PELL.GRANT FED.SUPPL.ED.OPP
## 1 0 0 0 0
## 2 0 550 795 0
## 3 0 0 0 0
## 4 0 6 3295 0
## 5 0 0 0 0
## 6 0 0 0 0
## OTHER.FED.GRANTS.AND.SCHOLARS WV.HIGHER.ED.GRANT.PROG PROMISE.SCHOLARS
## 1 0 0 0
## 2 0 0 0
## 3 0 0 0
## 4 0 0 0
## 5 0 0 0
## 6 0 0 0
## HEAPS..NOT.WF.DEVLPMNT.COMP. HEAPS.WF.DEVLPMNT.COMP
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## UNDERWOOD.SMITH.TEACHER.SCHOLARS WV.ENG..SCI..AND.TECH.SCHOLARS
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## OTHER.WV.STATE.GRANTS.AND.SCHOLARS OUT.OF.STATE.GRANTS.AND.SCHOLARS
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 556
## 5 0 0
## 6 0 0
## MISC.GRANTS.AND.SCHOLARS PROC..RULE.NO..49.UG.TUI.FEE.WAIV.ATHL
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## PROC..RULE.NO..49.UG.TUI.FEE.WAIV.ACAD
## 1 0
## 2 3000
## 3 0
## 4 4000
## 5 0
## 6 1500
## PROC..RULE.NO..49.UG.TUI.FEE.WAIV.NEED...OTHER
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## PROC..RULE.NO..49.GR...PR.TUI.FEE.WAIVS
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## INST.GRANTS.AND.SCHOLARS.ATHLETIC INST.GRANTS.AND.SCHOLARS.ACADEMIC
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## INST.GRANTS.AND.SCHOLARS.OTHER FED.WORK.STUDY..FWS..PROGRAM
## 1 0 0
## 2 1500 0
## 3 0 0
## 4 2000 0
## 5 0 0
## 6 0 0
## OTHER.FED.EMPLOYMENT INST.EMPLOYMENT
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## FILLER..WAS.FED.STAFFORD.LOAN....SUBSIDIZED.
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## FILLER..WAS.FED.STAFFORD.LOAN....UNSUBSIDIZED.
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## FED.DIRECT.LOAN....SUBSIDIZED FED.DIRECT.LOAN....UNSUBSIDIZED
## 1 0 0
## 2 4454 1980
## 3 0 0
## 4 4454 1980
## 5 0 0
## 6 0 0
## FED.DIRECT.PLUS FED.PERKINS.LOAN FILLER..WAS.FED.PLUS. OTHER.FED.LOANS
## 1 0 0 0 0
## 2 18456 0 0 0
## 3 0 0 0 0
## 4 14027 0 0 0
## 5 0 0 0 0
## 6 0 0 0 0
## MED.STUDENT.LOAN INST.LOANS MISC.LOANS VETS.AND.ACTIVE.DUTY.MIL.BENS
## 1 0 0 0 0
## 2 0 0 0 0
## 3 0 0 0 0
## 4 0 0 0 0
## 5 0 0 0 7789
## 6 0 0 30419 0
## VOC.REHAB.BENS OTHER.ED.BENS BOT.STATE.CODE.NULLED. NSLDS.SUB
## 1 0 24369 NA NA
## 2 0 0 NA 3500
## 3 0 0 NA 8000
## 4 0 0 NA 3500
## 5 0 0 NA NA
## 6 0 0 NA 3500
## NSLDS.UNSUB NSLDS.SUB.AND.UNSUB.TOTAL NSLDS.PERKINS.TOTAL
## 1 NA NA NA
## 2 2000 5500 NA
## 3 3980 11980 NA
## 4 2000 5500 NA
## 5 12000 12000 NA
## 6 2000 5500 NA
## FATHERS.HI.GRADE MOTHERS.HI.GRADE EXPECTED.TOT.FAM.CONT..EFC.
## 1 NA NA NA
## 2 2 3 4834
## 3 3 3 46
## 4 3 2 2396
## 5 3 2 13870
## 6 2 3 21298
## SPRING.TERM.ORIENTATION.IND SUM.I.TERM...ORIEN.IND
## 1
## 2
## 3
## 4
## 5
## 6
## SUM.II.TERM...ORIEN.IND FALL.TERM...ORIEN.IND EXTRA.TERM...ORIEN.IND
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## SPRING.TERM.APPLICATION.IND SUM.I.TERM...APPL.IND SUM.II.TERM...APPL.IND
## 1 NA
## 2 NA
## 3 NA
## 4 NA
## 5 Y NA
## 6 NA
## FALL.TERM...APPL.IND EXTRA.TERM...APPL.IND SPRING.TERM.ADM.DEC.MADE.IND
## 1 Y NA
## 2 Y NA
## 3 NA
## 4 NA
## 5 NA
## 6 Y NA
## SUM.I.TERM...ADM.DEC.MADE.IND SUM.II.TERM...ADM.DEC.MADE.IND
## 1 NA
## 2 NA
## 3 NA
## 4 NA
## 5 Y NA
## 6 NA
## FALL.TERM...ADM.DEC.MADE.IND EXTRA.TERM...ADM.DEC.MADE.IND
## 1 Y NA
## 2 Y NA
## 3 NA
## 4 NA
## 5 NA
## 6 Y NA
## SPRING.TERM.ENR.IND SUM.I.TERM...ENR.IND SUM.II.TERM...ENR.IND
## 1 Y Y NA
## 2 Y NA
## 3 Y Y NA
## 4 Y Y NA
## 5 Y Y NA
## 6 Y Y NA
## FALL.TERM...ENR.IND EXTRA.TERM...ENR.IND SPRING.TERM.REG.IND
## 1 Y NA Y
## 2 Y NA Y
## 3 Y NA Y
## 4 Y NA Y
## 5 Y NA Y
## 6 Y NA Y
## SUM.I.TERM...REG.IND SUM.II.TERM...REG.IND FALL.TERM...REG.IND
## 1 Y NA Y
## 2 NA Y
## 3 Y NA Y
## 4 Y NA Y
## 5 Y NA Y
## 6 Y NA Y
## EXTRA.TERM...REG.IND SPRING.TERM.APPL.FOR.DEGR.IND
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## SUM.I.TERM...APPL.FOR.DEGR.IND SUM.II.TERM...APPL.FOR.DEGR.IND
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## FALL.TERM...APPL.FOR.DEGR.IND EXTRA.TERM...APPL.FOR.DEGR.IND
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## SPRING.TERM.GRAD.IND SUM.I.TERM...GRAD.IND SUM.II.TERM...GRAD.IND
## 1 Y NA
## 2 NA
## 3 Y NA
## 4 NA
## 5 NA
## 6 NA
## FALL.TERM...GRAD.IND EXTRA.TERM...GRAD.IND BORN.BEFORE.DATE.IND
## 1 Y NA NA
## 2 NA 2
## 3 NA 2
## 4 NA 2
## 5 NA 2
## 6 NA 2
## GRAD.OR.PROF.IND MARRIED.IND HAVE.CHILD.SUPPORT.IND US.INCOME
## 1 NA NA NA NA
## 2 2 2 2 2130
## 3 2 2 2 3715
## 4 2 2 2 NA
## 5 2 2 2 5296
## 6 2 2 2 2900
## USER.DEFINES.FIELD..VARIES. STD.CAMP.CODE DEPEND.STAT AGI.FOR.PAR
## 1 NA SWA NA
## 2 NA SWA D 68307
## 3 NA SWA D 36414
## 4 NA SWA D 59068
## 5 NA SWA D 119268
## 6 NA SWA D 123000
## NUM.IN.PARS.HOUSE NUM.IN.STUDS.HOUSE ACAD.EXCEL.L1.WAIV....0WVAE1
## 1 NA NA 0
## 2 5 5 0
## 3 4 NA 0
## 4 4 NA 0
## 5 4 NA 0
## 6 4 NA 0
## ACAD.EXCEL.L2.WAIV....0WVAE2 BLUE...GOLD.WAIV.LEVEL.1...0WVBG1
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 4000
## 5 0 0
## 6 0 0
## BLUE...GOLD.WAIV.LEVEL.2...0WVBG2 SCHOLAR.S.WAIV.EQUIVALENT...0WVEQV
## 1 0 0
## 2 3000 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 1500 0
## FILLER..WAS.ACADC.COMP.GRANT. FILLER..WAS.NATN.SMART.GRANT.
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## GEAR.UP..GAINING.EARLY.AWARE.READ..UG.PROGS. FED.DIRECT.GRAD.PLUS
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## FILLER..WAS.STAFFORD.GRAD.PLUS. OTHER.CATS.UNDER.PB.49 NEW.ETHNIC.CODE
## 1 0 0 1
## 2 0 0 1
## 3 0 0 1
## 4 0 0 1
## 5 0 0 1
## 6 0 0 1
## AMER.IND.OR.ALSK.NATV.IND ASIAN.IND BLACK.OR.AFRICAN.AMER.IND
## 1 N N N
## 2 N N N
## 3 N N N
## 4 N N N
## 5 N N N
## 6 N N N
## NATV.HAWAIIAN.OR.PACIF.ISL.IND WHITE.IND HISPANIC.IND UNKNOWN.RACE.IND
## 1 N Y N N
## 2 N Y N N
## 3 N N N Y
## 4 N Y N N
## 5 N Y N N
## 6 N Y N N
## EXTRA.RACE.CODES UG.TUI.FEE.WAIVS.CHILD.SPOUS
## 1 NA 0
## 2 NA 0
## 3 NA 0
## 4 NA 0
## 5 NA 0
## 6 NA 0
## UG.TUI.FEE.WAIVS.INDS.OVER.65 UG.TUI.FEE.WAIVS.HS.GRADS.IN.FOSTER.CARE
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## UG.TUI.FEE.WAIVS.PRPL.HRT.MDL.OF.HNR.RECIPS
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## UG.TUI.FEE.WAIVS.CHILD.SPOUS.OF.ARMED.FORCES.KILL.IN.ACT..ETC.
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## UG.TUI.FEE.WAIVS.HLTH.SCI.TECH.ACAD..HSTA.
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## UG.TUI.FEE.WAIVS.EMP.OF.THE.INST
## 1 0
## 2 0
## 3 0
## 4 0
## 5 0
## 6 0
## UG.TUI.FEE.WAIVS.SPOUS.DEPEND.OF.EMP.OF.THE.INST YELLOW.RIBBON.IND
## 1 0 N
## 2 0 N
## 3 0 N
## 4 0 N
## 5 0 N
## 6 0 N
## YELLOW.RIBBON.INST.AMT YELLOW.RIBBON.VETS.ADMIN.AMT
## 1 0 0
## 2 0 0
## 3 0 0
## 4 0 0
## 5 0 0
## 6 0 0
## IPEDS.LIVING.ARRANGE.CODE HEPC.ID..NULLED. GED.SCORE TASCP.SCORE
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## EXPECTED.FAMILY.CONTRIBUTION..EFC. HOUS.ARRANGE..HEPC.LIV.ARRANGES.CODE.
## 1 99999998 NA
## 2 4834 NA
## 3 99999998 NA
## 4 2396 NA
## 5 99999998 NA
## 6 21298 NA
## MISSING.HEPC.STU.RECORDS.IND..NULLED. HEPC.STU.FILE.SUB.YEAR..NULLED.
## 1 NA NA
## 2 NA NA
## 3 NA NA
## 4 NA NA
## 5 NA NA
## 6 NA NA
## HEPC.STU.FILE.SUB.TERM..NULLED.
## 1 NA
## 2 NA
## 3 NA
## 4 NA
## 5 NA
## 6 NA
dim(dat)
## [1] 16480 257
#Additional packages
install.packages("dae") #Allows combining factors
## Installing package into '/users/sbranham/R/x86_64-redhat-linux-gnu-library/3.3'
## (as 'lib' is unspecified)
library(dae)
## Loading required package: ggplot2
install.packages("scales")
## Installing package into '/users/sbranham/R/x86_64-redhat-linux-gnu-library/3.3'
## (as 'lib' is unspecified)
## Warning in install.packages("scales"): installation of package 'scales' had
## non-zero exit status
library(scales)
install.packages("gsubfn")
## Installing package into '/users/sbranham/R/x86_64-redhat-linux-gnu-library/3.3'
## (as 'lib' is unspecified)
library(gsubfn)
## Loading required package: proto
## Warning in fun(libname, pkgname): couldn't connect to display ":0"
install.packages("alr4")
## Installing package into '/users/sbranham/R/x86_64-redhat-linux-gnu-library/3.3'
## (as 'lib' is unspecified)
library(alr4)
## Loading required package: car
## Loading required package: effects
## Loading required package: carData
##
## Attaching package: 'carData'
## The following objects are masked from 'package:car':
##
## Guyer, UN, Vocab
## lattice theme set by effectsTheme()
## See ?effectsTheme for details.
#Subpopulations we want to work with
#SubPop 1. First Time Freshman
#Create subset of data with only First Time Freshmen (firstTimeFresh)
firstTimeFresh <- dat[which(dat$GS.ADMIT.TYPE.DESC == "First Time Freshman"),]
dim(firstTimeFresh)
## [1] 8590 257
#Can create other subpopulations if needed (grad students, seniors, etc)
#Dependent variables
#Personal attributes
#1. Gender (studentGender)
studentGender <- as.factor(firstTimeFresh$SEX.CODE)
summary(studentGender)
## F M
## 3922 4668
levels(studentGender)
## [1] "F" "M"
#2. Ethnicity (studentEthn)
studentEthn <- factor(firstTimeFresh$ETHNIC.CODE, labels = c("White", "Black", "Hispanic", "Asian", "Native", "Unknown"))
summary(studentEthn)
## White Black Hispanic Asian Native Unknown NA's
## 3435 446 79 106 16 4464 44
levels(studentEthn)
## [1] "White" "Black" "Hispanic" "Asian" "Native" "Unknown"
#3. Major (degreeF)
degreeF <- firstTimeFresh$GS.DEGREE.DESC
summary(degreeF) #Shows degrees w/ 0 students in it
## Associate of Applied Sci
## 0 98
## Associate of Arts Bachelor Electronic Engr
## 847 2
## Bachelor Engr Tech Bachelor of Applied Science
## 4 0
## Bachelor of Arts Bachelor of Fine Arts
## 2040 113
## Bachelor of Multidisc. Studies Bachelor of Music
## 150 81
## Bachelor of Science Bachelor of Science in Nursing
## 3430 13
## Bachelor of Social Work BS in Aerospace Engineering
## 42 62
## BS in Agriculture BS in Biometric Systems
## 58 11
## BS in Business Administration BS in Chemical Engineering
## 797 51
## BS in Civil Engineering BS in Computer Engineering
## 53 29
## BS in Computer Science BS in Electrical Engineering
## 59 44
## BS in Forestry BS in Industrial Engineering
## 40 37
## BS in Journalism BS in Landscape Architecture
## 238 27
## BS in Mechanical Engineering BS in Mining Engineering
## 63 11
## BS in Petroleum & Natl Gas Eng BS in Physical Education
## 42 17
## BS in Recreation Degree Not Declared
## 17 111
## Doctor of Audiology Doctor of Dental Surgery
## 0 0
## Doctor of Education Doctor of Jurisprudence
## 0 0
## Doctor of Medicine Doctor of Musical Arts
## 0 0
## Doctor of Nursing Practice Doctor of Pharmacy
## 0 0
## Doctor of Philosophy Doctor of Physical Therapy
## 0 0
## Master of Agriculture Master of Arts
## 0 0
## Master of Business Admnstrtn Master of Fine Arts
## 0 0
## Master of Landscape Arc Master of Legal Studies
## 0 0
## Master of Music Master of Occupational Therapy
## 0 0
## Master of Professional Acct Master of Professional Studies
## 0 0
## Master of Public Admnstrtn Master of Public Health
## 0 0
## Master of Science Master of Science in Forestry
## 0 0
## Master of Science in Nursing Master of Social Work
## 0 0
## Master's in Health Sciences MS in Aerospace Engineering
## 0 0
## MS in Chemical Engineering MS in Civil Engineering
## 0 0
## MS in Computer Science MS in Electrical Engineering
## 0 0
## MS in Engineering MS in Industrial Engineering
## 0 0
## MS in Journalism MS in Mechanical Engineering
## 0 0
## MS in Mining Engineering MS in Petrl & Natural Gas Engr
## 0 0
## MS in Software Engineering Regents Bachelor of Arts
## 0 3
degreeF <- factor(degreeF) #Excludes unused levels
summary(degreeF) #All majors have at least 1 student it in
## Associate of Applied Sci Associate of Arts
## 98 847
## Bachelor Electronic Engr Bachelor Engr Tech
## 2 4
## Bachelor of Arts Bachelor of Fine Arts
## 2040 113
## Bachelor of Multidisc. Studies Bachelor of Music
## 150 81
## Bachelor of Science Bachelor of Science in Nursing
## 3430 13
## Bachelor of Social Work BS in Aerospace Engineering
## 42 62
## BS in Agriculture BS in Biometric Systems
## 58 11
## BS in Business Administration BS in Chemical Engineering
## 797 51
## BS in Civil Engineering BS in Computer Engineering
## 53 29
## BS in Computer Science BS in Electrical Engineering
## 59 44
## BS in Forestry BS in Industrial Engineering
## 40 37
## BS in Journalism BS in Landscape Architecture
## 238 27
## BS in Mechanical Engineering BS in Mining Engineering
## 63 11
## BS in Petroleum & Natl Gas Eng BS in Physical Education
## 42 17
## BS in Recreation Degree Not Declared
## 17 111
## Regents Bachelor of Arts
## 3
levels(degreeF)
## [1] "Associate of Applied Sci" "Associate of Arts"
## [3] "Bachelor Electronic Engr" "Bachelor Engr Tech"
## [5] "Bachelor of Arts" "Bachelor of Fine Arts"
## [7] "Bachelor of Multidisc. Studies" "Bachelor of Music"
## [9] "Bachelor of Science" "Bachelor of Science in Nursing"
## [11] "Bachelor of Social Work" "BS in Aerospace Engineering"
## [13] "BS in Agriculture" "BS in Biometric Systems"
## [15] "BS in Business Administration" "BS in Chemical Engineering"
## [17] "BS in Civil Engineering" "BS in Computer Engineering"
## [19] "BS in Computer Science" "BS in Electrical Engineering"
## [21] "BS in Forestry" "BS in Industrial Engineering"
## [23] "BS in Journalism" "BS in Landscape Architecture"
## [25] "BS in Mechanical Engineering" "BS in Mining Engineering"
## [27] "BS in Petroleum & Natl Gas Eng" "BS in Physical Education"
## [29] "BS in Recreation" "Degree Not Declared"
## [31] "Regents Bachelor of Arts"
#4. Type of major (degreeType)
#Some majors are associates, and some are bachelors, want to split assocDegree and bachelDegree and otherDegree
assocDegree1 <- factor(degreeF == "Associate of Applied Sci")
assocDegree2 <- factor(degreeF == "Associate of Arts")
notDecDegree <- factor(degreeF == "Degree Not Declared")
regDegree <- factor(degreeF == "Regents Bachelor of Arts")
degreeType <- fac.combine(list(assocDegree1, assocDegree2, notDecDegree, regDegree))
degreeType <- factor(degreeType, labels = c("Bachelor Degree", "Regent Degree", "Degree Not Declared", "Associate Arts", "Associate Applied Sci"))
summary(degreeType)
## Bachelor Degree Regent Degree Degree Not Declared
## 7531 3 111
## Associate Arts Associate Applied Sci
## 847 98
levels(degreeType)
## [1] "Bachelor Degree" "Regent Degree" "Degree Not Declared"
## [4] "Associate Arts" "Associate Applied Sci"
#Location attributes
#1. Student location by state (studentLoc)
studentLoc <- as.factor(firstTimeFresh$MAIL.STATE)
summary(studentLoc)
## AB AE AK AL AP AR AZ BC CA CO CT DC DE FL
## 0 0 1 1 6 1 4 2 2 44 10 73 93 71 64
## FR GA GU HI IA ID IL IN KS KY LA MA MB MD ME
## 22 38 0 0 6 0 35 13 2 9 2 60 0 778 3
## MI MN MO MP MS MT NB NC ND NE NH NJ NM NV NY
## 19 5 5 0 2 1 0 45 1 1 9 473 1 4 291
## OH OK ON OR PA PQ PR RI SC SD TN TX UT VA VT
## 302 5 4 3 935 0 1 7 21 1 20 50 1 673 8
## WA WI WV WY
## 8 13 4341 0
levels(studentLoc)
## [1] "" "AB" "AE" "AK" "AL" "AP" "AR" "AZ" "BC" "CA" "CO" "CT" "DC" "DE"
## [15] "FL" "FR" "GA" "GU" "HI" "IA" "ID" "IL" "IN" "KS" "KY" "LA" "MA" "MB"
## [29] "MD" "ME" "MI" "MN" "MO" "MP" "MS" "MT" "NB" "NC" "ND" "NE" "NH" "NJ"
## [43] "NM" "NV" "NY" "OH" "OK" "ON" "OR" "PA" "PQ" "PR" "RI" "SC" "SD" "TN"
## [57] "TX" "UT" "VA" "VT" "WA" "WI" "WV" "WY"
studentLoc <- factor(studentLoc) #remove unused levels
summary(studentLoc)
## AE AK AL AP AR AZ BC CA CO CT DC DE FL FR GA
## 1 1 6 1 4 2 2 44 10 73 93 71 64 22 38
## IA IL IN KS KY LA MA MD ME MI MN MO MS MT NC
## 6 35 13 2 9 2 60 778 3 19 5 5 2 1 45
## ND NE NH NJ NM NV NY OH OK ON OR PA PR RI SC
## 1 1 9 473 1 4 291 302 5 4 3 935 1 7 21
## SD TN TX UT VA VT WA WI WV
## 1 20 50 1 673 8 8 13 4341
prop.table(table(studentLoc)) #50% of the students come from WV
## studentLoc
## AE AK AL AP AR
## 0.0001164144 0.0001164144 0.0006984866 0.0001164144 0.0004656577
## AZ BC CA CO CT
## 0.0002328289 0.0002328289 0.0051222352 0.0011641444 0.0084982538
## DC DE FL FR GA
## 0.0108265425 0.0082654249 0.0074505239 0.0025611176 0.0044237485
## IA IL IN KS KY
## 0.0006984866 0.0040745052 0.0015133877 0.0002328289 0.0010477299
## LA MA MD ME MI
## 0.0002328289 0.0069848661 0.0905704307 0.0003492433 0.0022118743
## MN MO MS MT NC
## 0.0005820722 0.0005820722 0.0002328289 0.0001164144 0.0052386496
## ND NE NH NJ NM
## 0.0001164144 0.0001164144 0.0010477299 0.0550640279 0.0001164144
## NV NY OH OK ON
## 0.0004656577 0.0338766007 0.0351571595 0.0005820722 0.0004656577
## OR PA PR RI SC
## 0.0003492433 0.1088474971 0.0001164144 0.0008149010 0.0024447031
## SD TN TX UT VA
## 0.0001164144 0.0023282887 0.0058207218 0.0001164144 0.0783469150
## VT WA WI WV
## 0.0009313155 0.0009313155 0.0015133877 0.5053550640
#2. In and out of state indicator (stateIndicator)
stateIndicator <- factor(studentLoc == "WV", labels = c("Out-of-State", "In-State"))
summary(stateIndicator)
## Out-of-State In-State
## 4249 4341
#3. Proximity indicator (proxStudentType)
#Assumptions:
#In-state students will commute to Morgantown, the furthest out, the more the student will require assistance, after a certain distance, it makes no sense to commute and we can assume the student will move to Morgantown.
#Assume the population from Monongalia will commute
#Assume the population from the following counties will also commute (~1 hour) and should be eligible for additional assistance: Preston, Taylor, Marion
#For all counties outside of this radius we assume would move to Morgantown
#Monongalia == shortCommuteStudent
#Preston, Taylor, Marion == longCommuteStudent
#Every other in-state counties == resStudent
shortCommuteStudent <- factor(firstTimeFresh$MAIL.CNTY.DESC == "Monongalia, WV")
longCommuteStudent <- factor(firstTimeFresh$MAIL.CNTY.DESC == "Preston, WV" | firstTimeFresh$MAIL.CNTY.DESC == "Taylor, WV" | firstTimeFresh$MAIL.CNTY.DESC == "Marion, WV")
summary(shortCommuteStudent) #1529
## FALSE TRUE
## 7061 1529
summary(longCommuteStudent) #227
## FALSE TRUE
## 8363 227
proxStudentType <- fac.combine(list(shortCommuteStudent, longCommuteStudent))
summary(proxStudentType)
## 1 2 3
## 6834 227 1529
proxStudentType <- factor(proxStudentType, labels = c("Res or Out-of-State", "Long Commute", "Short Commute"))
#Affinity
affinityStatus <- as.factor(firstTimeFresh$LEGACY.DESC == "" | firstTimeFresh$LEGACY.DESC == "*No Family Member is Alumnus")
affinityStatus <- factor(affinityStatus, labels = c("Some Affinity", "No Affinity"))
summary(affinityStatus)
## Some Affinity No Affinity
## 3718 4872
#Affordability attributes
expectedFamContrib <- rescale(firstTimeFresh$EXPECTED.TOT.FAM.CONT..EFC, to = c(0,100))
summary(expectedFamContrib)
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## 0.000 1.351 9.965 18.080 25.160 100.000 436
#Academic Achievement attributes
#The academic achievement variables from the data are:
#HIGH.SCHOOL.GPA
#PREVIOUS.COLL.GPA
#HIGHEST.ACT.SUM.OF.STANDARD.SCORES
#SAT.TOTAL..HIGHEST.SMV.
#GED.SCORE
#Not all of these variables are ready for analysis, so this section will work on checking through each academic achievement variable and getting it ready.
#HIGH.SCHOOL.GPA
#go ahead and Weight the Unweighted HIGH.SCHOOL.GPAs from 0 to 5.0 instead of 0 to 4.0 while referencing WEIGHTED.GPA.IND variable.
highSchoolGPA <- ifelse((firstTimeFresh$WEIGHTED.GPA.IND=="NW") & (firstTimeFresh$HIGH.SCHOOL.GPA <=4), firstTimeFresh$HIGH.SCHOOL.GPA * 1.25, ifelse(firstTimeFresh$WEIGHTED.GPA.IND == "W", firstTimeFresh$HIGH.SCHOOL.GPA * 1, NA))
#PREVIOUS.COLL.GPA
#Need to mark the values that are greater than 4.0 as NA. This is invalid information.
prevColGPA <- ifelse((firstTimeFresh$PREVIOUS.COLL.GPA > 4), NA, firstTimeFresh$PREVIOUS.COLL.GPA)
#HIGHEST.ACT.SUM.OF.STANDARD.SCORES
highestACT <- firstTimeFresh$HIGHEST.ACT.SUM.OF.STANDARD.SCORES
#SAT.TOTAL..HIGHEST.SMV.
totalSAT <- firstTimeFresh$SAT.TOTAL..HIGHEST.SMV.
#GED.SCORE
#remove the "G" from GED.SCORE to create a numeric value for scaling
scoreGED <- gsub("G", "", firstTimeFresh$GED.SCORE)
scoreGED <- as.numeric(as.character(scoreGED))
summary(scoreGED) # worked. Values 0 to 75.
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## 0.00 51.00 55.00 55.44 61.00 75.00 8425
#The 5 academic variables that we will use are:
#highSchoolGPA - Values 1.25 to 5.00
#prevColGPA - Values 0.00 to 4.00
#highestACT - Values 33 to 142
#totalSAT - Values 305 to 1600
#scoreGED - Values 0 to 75.
#Now that we have the 5 academic achievement variables formatted properly, we can scale the academic variables from 0 to 100 to create an even scale.
highSchoolGPA <- rescale(highSchoolGPA, to = c(1,100))
prevColGPA <- rescale(prevColGPA, to = c(1,100))
highestACT <- rescale(highestACT, to = c(1,100))
totalSAT <- rescale(totalSAT, to = c(1,100))
scoreGED <- rescale(scoreGED, to = c(1,100))
#The 5 academic achievement variables are now each on a percentile scale of 0 to 100. We just need to get the (count of which 5 academic variables in each row that are not NA) and use this to divide the (sum of the 5 academic variables in each row) to create the SCALED.ACADEMIC.ACHIEVEMENT variable that will be between 0 to 100 for each student.
# First Sum the 5 variables together
academAchievSum <- cbind.data.frame(highSchoolGPA, prevColGPA, highestACT, totalSAT, scoreGED)
academAchiev <- rowSums(academAchievSum[, c("highSchoolGPA", "prevColGPA", "highestACT", "totalSAT", "scoreGED")], na.rm = TRUE)
summary(academAchiev)
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## 0.0 157.0 205.4 204.3 252.0 413.7
#Second get a count of NAs within the 5 variables by row.
countNA <- rowSums(is.na(academAchievSum[, c("highSchoolGPA", "prevColGPA", "highestACT", "totalSAT", "scoreGED")]))
summary(countNA)
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## 0.000 1.000 2.000 1.856 2.000 5.000
#Create the SCALED.ACADEMIC.ACHIEVEMENT variable
scaledAcademAchiev <- academAchiev / (5 - countNA)
summary(scaledAcademAchiev)
## Min. 1st Qu. Median Mean 3rd Qu. Max. NA's
## 13.60 57.17 65.44 64.69 72.64 100.00 1
#Independent variables
#Define 21 different grant types - this code only works for FTF, rework the code later to be able to work with any subpopulation we want
#Federal aid
fedDirLoan_unsub <- firstTimeFresh$FED.DIRECT.LOAN....UNSUBSIDIZED
fedDirLoan_sub <- firstTimeFresh$FED.DIRECT.LOAN....SUBSIDIZED
fedDirPlus <- firstTimeFresh$FED.DIRECT.PLUS
fedPellGrant <- firstTimeFresh$FED.PELL.GRANT
fedSupOpp <- firstTimeFresh$FED.SUPPL.ED.OPP
fedOther <- firstTimeFresh$OTHER.FED.GRANTS.AND.SCHOLARS + firstTimeFresh$OTHER.FED.LOANS
#Misc grants
miscGrants <- firstTimeFresh$MISC.GRANTS.AND.SCHOLARS
outOfStateGrant <- firstTimeFresh$OUT.OF.STATE.GRANTS.AND.SCHOLARS
medStudLoan <- firstTimeFresh$MED.STUDENT.LOAN
#WVU grants
rule49Grant <- firstTimeFresh$PROC..RULE.NO..49.GR...PR.TUI.FEE.WAIVS + firstTimeFresh$PROC..RULE.NO..49.UG.TUI.FEE.WAIV.ACAD + firstTimeFresh$PROC..RULE.NO..49.UG.TUI.FEE.WAIV.ATHL + firstTimeFresh$PROC..RULE.NO..49.UG.TUI.FEE.WAIV.NEED...OTHER
instEmployAid <- firstTimeFresh$INST.EMPLOYMENT
instGrantAcademic <- firstTimeFresh$INST.GRANTS.AND.SCHOLARS.ACADEMIC
instGrantAthletic <- firstTimeFresh$INST.GRANTS.AND.SCHOLARS.ATHLETIC
instGrantOther <- firstTimeFresh$INST.GRANTS.AND.SCHOLARS.OTHER
#West Virgina (state) grants
wvHigherEdGrant <- firstTimeFresh$WV.HIGHER.ED.GRANT.PROG
promScholars <- firstTimeFresh$PROMISE.SCHOLARS
wvOther <- firstTimeFresh$OTHER.WV.STATE.GRANTS.AND.SCHOLARS
#Build our data of independent and dependent variables
#WVU financial aid variables - will have to be combined into 1 independent variable
finDataTableWVU <- cbind.data.frame(rule49Grant, instEmployAid, instGrantAcademic, instGrantAthletic, instGrantOther)
#Calculate total WVU award pool
totalAwardWVU <- rule49Grant + instEmployAid + instGrantAcademic + instGrantAthletic + instGrantOther
sum(totalAwardWVU)
## [1] 18510879
#The total WVU award amount for the years 2013-14 for first time freshman is 18.5$MM
#Calculate total non WVU award pool
totalAwardnonWVU <- fedDirLoan_unsub + fedDirLoan_sub + fedDirPlus + fedPellGrant + fedSupOpp + fedOther + miscGrants + outOfStateGrant + medStudLoan + wvHigherEdGrant + promScholars + wvOther
sum(totalAwardnonWVU) #66.5$MM
## [1] 66540034
#Calculate Promise Scholar award
totalAwardScholar <- promScholars
sum(totalAwardScholar) #7.5$MM
## [1] 7508903
#Add the dependent variables to finDataTable
studentGender -> finDataTableWVU$studentGender
studentEthn -> finDataTableWVU$studentEthn
degreeF -> finDataTableWVU$degreeF
degreeType -> finDataTableWVU$degreeType
studentLoc -> finDataTableWVU$studentLoc
stateIndicator -> finDataTableWVU$stateIndicator
proxStudentType -> finDataTableWVU$proxStudentType
highSchoolGPA -> finDataTableWVU$highSchoolGPA
prevColGPA -> finDataTableWVU$prevColGPA
highestACT -> finDataTableWVU$highestACT
totalSAT -> finDataTableWVU$totalSAT
scoreGED -> finDataTableWVU$scoreGED
scaledAcademAchiev -> finDataTableWVU$scaledAcademAchiev
affinityStatus -> finDataTableWVU$affinityStatus
expectedFamContrib -> finDataTableWVU$expectedFamContrib
summary(finDataTableWVU)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0.0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0.0 1st Qu.: 0.0
## Median : 0 Median : 0.0 Median : 0.0 Median : 0.0
## Mean : 950 Mean : 189.3 Mean : 526.6 Mean : 301.2
## 3rd Qu.: 0 3rd Qu.: 0.0 3rd Qu.: 0.0 3rd Qu.: 0.0
## Max. :21336 Max. :17233.0 Max. :15603.0 Max. :41170.0
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:3922 White :3435
## 1st Qu.: 0.0 M:4668 Black : 446
## Median : 0.0 Hispanic: 79
## Mean : 187.8 Asian : 106
## 3rd Qu.: 0.0 Native : 16
## Max. :9338.0 Unknown :4464
## NA's : 44
## degreeF degreeType
## Bachelor of Science :3430 Bachelor Degree :7531
## Bachelor of Arts :2040 Regent Degree : 3
## Associate of Arts : 847 Degree Not Declared : 111
## BS in Business Administration : 797 Associate Arts : 847
## BS in Journalism : 238 Associate Applied Sci: 98
## Bachelor of Multidisc. Studies: 150
## (Other) :1088
## studentLoc stateIndicator proxStudentType
## WV :4341 Out-of-State:4249 Res or Out-of-State:6834
## PA : 935 In-State :4341 Long Commute : 227
## MD : 778 Short Commute :1529
## VA : 673
## NJ : 473
## OH : 302
## (Other):1088
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 1.00 Min. : 1.00 Min. : 1.00 Min. : 1.00
## 1st Qu.: 58.97 1st Qu.: 73.27 1st Qu.: 45.50 1st Qu.: 45.00
## Median : 73.43 Median : 85.64 Median : 54.59 Median : 52.62
## Mean : 71.21 Mean : 82.45 Mean : 55.49 Mean : 53.08
## 3rd Qu.: 84.87 3rd Qu.: 95.79 3rd Qu.: 64.58 3rd Qu.: 60.23
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
## NA's :145 NA's :3510 NA's :2074 NA's :1793
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 1.00 Min. : 13.60 Some Affinity:3718
## 1st Qu.: 68.32 1st Qu.: 57.17 No Affinity :4872
## Median : 73.60 Median : 65.44
## Mean : 74.18 Mean : 64.69
## 3rd Qu.: 81.52 3rd Qu.: 72.64
## Max. :100.00 Max. :100.00
## NA's :8425 NA's :1
## expectedFamContrib
## Min. : 0.000
## 1st Qu.: 1.351
## Median : 9.965
## Mean : 18.078
## 3rd Qu.: 25.156
## Max. :100.000
## NA's :436
#add totalAwardWVU, totalAwardnonWVU to our finDataWVU table
totalAwardWVU -> finDataTableWVU$totalAwardWVU
totalAwardnonWVU -> finDataTableWVU$totalAwardnonWVU
totalAwardScholar -> finDataTableWVU$totalAwardPromScholar
summary(finDataTableWVU)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0.0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0.0 1st Qu.: 0.0
## Median : 0 Median : 0.0 Median : 0.0 Median : 0.0
## Mean : 950 Mean : 189.3 Mean : 526.6 Mean : 301.2
## 3rd Qu.: 0 3rd Qu.: 0.0 3rd Qu.: 0.0 3rd Qu.: 0.0
## Max. :21336 Max. :17233.0 Max. :15603.0 Max. :41170.0
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:3922 White :3435
## 1st Qu.: 0.0 M:4668 Black : 446
## Median : 0.0 Hispanic: 79
## Mean : 187.8 Asian : 106
## 3rd Qu.: 0.0 Native : 16
## Max. :9338.0 Unknown :4464
## NA's : 44
## degreeF degreeType
## Bachelor of Science :3430 Bachelor Degree :7531
## Bachelor of Arts :2040 Regent Degree : 3
## Associate of Arts : 847 Degree Not Declared : 111
## BS in Business Administration : 797 Associate Arts : 847
## BS in Journalism : 238 Associate Applied Sci: 98
## Bachelor of Multidisc. Studies: 150
## (Other) :1088
## studentLoc stateIndicator proxStudentType
## WV :4341 Out-of-State:4249 Res or Out-of-State:6834
## PA : 935 In-State :4341 Long Commute : 227
## MD : 778 Short Commute :1529
## VA : 673
## NJ : 473
## OH : 302
## (Other):1088
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 1.00 Min. : 1.00 Min. : 1.00 Min. : 1.00
## 1st Qu.: 58.97 1st Qu.: 73.27 1st Qu.: 45.50 1st Qu.: 45.00
## Median : 73.43 Median : 85.64 Median : 54.59 Median : 52.62
## Mean : 71.21 Mean : 82.45 Mean : 55.49 Mean : 53.08
## 3rd Qu.: 84.87 3rd Qu.: 95.79 3rd Qu.: 64.58 3rd Qu.: 60.23
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
## NA's :145 NA's :3510 NA's :2074 NA's :1793
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 1.00 Min. : 13.60 Some Affinity:3718
## 1st Qu.: 68.32 1st Qu.: 57.17 No Affinity :4872
## Median : 73.60 Median : 65.44
## Mean : 74.18 Mean : 64.69
## 3rd Qu.: 81.52 3rd Qu.: 72.64
## Max. :100.00 Max. :100.00
## NA's :8425 NA's :1
## expectedFamContrib totalAwardWVU totalAwardnonWVU
## Min. : 0.000 Min. : 0.0 Min. : 0
## 1st Qu.: 1.351 1st Qu.: 0.0 1st Qu.: 0
## Median : 9.965 Median : 447.5 Median : 5444
## Mean : 18.078 Mean : 2154.9 Mean : 7746
## 3rd Qu.: 25.156 3rd Qu.: 3000.0 3rd Qu.:12645
## Max. :100.000 Max. :43560.0 Max. :44595
## NA's :436
## totalAwardPromScholar
## Min. : 0.0
## 1st Qu.: 0.0
## Median : 0.0
## Mean : 874.1
## 3rd Qu.: 0.0
## Max. :7125.0
##
names(finDataTableWVU)
## [1] "rule49Grant" "instEmployAid"
## [3] "instGrantAcademic" "instGrantAthletic"
## [5] "instGrantOther" "studentGender"
## [7] "studentEthn" "degreeF"
## [9] "degreeType" "studentLoc"
## [11] "stateIndicator" "proxStudentType"
## [13] "highSchoolGPA" "prevColGPA"
## [15] "highestACT" "totalSAT"
## [17] "scoreGED" "scaledAcademAchiev"
## [19] "affinityStatus" "expectedFamContrib"
## [21] "totalAwardWVU" "totalAwardnonWVU"
## [23] "totalAwardPromScholar"
#Identify subset of students that received WVU aid, Other aid, are Promise students
aidStudentWVU <- factor(finDataTableWVU$totalAwardWVU > 0, labels = c("Did not received WVU aid", "Received WVU aid"))
aidStudentnonWVU <- factor(finDataTableWVU$totalAwardnonWVU > 0, labels = c("Did not received other aid", "Received other aid"))
aidStudentPromScholar <- factor(finDataTableWVU$totalAwardPromScholar > 0, labels = c("Is not Promise", "Is Promise"))
aidStudentWVU -> finDataTableWVU$aidStudentWVU
aidStudentnonWVU -> finDataTableWVU$aidStudentnonWVU
aidStudentPromScholar -> finDataTableWVU$aidStudentPromScholar
#create new table with only students that have been awarded > 4000
finDataTableWVU_AL1 <- subset(finDataTableWVU, totalAwardWVU > 40000)
summary(finDataTableWVU_AL1)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. :0 Min. :0 Min. : 0 Min. :38293
## 1st Qu.:0 1st Qu.:0 1st Qu.: 0 1st Qu.:40037
## Median :0 Median :0 Median :3000 Median :40308
## Mean :0 Mean :0 Mean :1800 Mean :40074
## 3rd Qu.:0 3rd Qu.:0 3rd Qu.:3000 3rd Qu.:40560
## Max. :0 Max. :0 Max. :3000 Max. :41170
##
## instGrantOther studentGender studentEthn
## Min. :0 F:1 White :1
## 1st Qu.:0 M:4 Black :0
## Median :0 Hispanic:0
## Mean :0 Asian :0
## 3rd Qu.:0 Native :0
## Max. :0 Unknown :4
##
## degreeF degreeType studentLoc
## Bachelor of Science :3 Bachelor Degree :5 WV :4
## Bachelor of Arts :1 Regent Degree :0 GA :1
## BS in Business Administration:1 Degree Not Declared :0 AE :0
## Associate of Applied Sci :0 Associate Arts :0 AK :0
## Associate of Arts :0 Associate Applied Sci:0 AL :0
## Bachelor Electronic Engr :0 AP :0
## (Other) :0 (Other):0
## stateIndicator proxStudentType highSchoolGPA
## Out-of-State:1 Res or Out-of-State:1 Min. :55.88
## In-State :4 Long Commute :0 1st Qu.:66.91
## Short Commute :4 Median :71.75
## Mean :69.45
## 3rd Qu.:75.25
## Max. :77.47
##
## prevColGPA highestACT totalSAT scoreGED
## Min. :87.62 Min. :42.78 Min. :42.46 Min. : NA
## 1st Qu.:87.62 1st Qu.:53.22 1st Qu.:52.62 1st Qu.: NA
## Median :87.62 Median :63.67 Median :57.69 Median : NA
## Mean :87.62 Mean :59.73 Mean :57.35 Mean :NaN
## 3rd Qu.:87.62 3rd Qu.:68.21 3rd Qu.:64.46 3rd Qu.: NA
## Max. :87.62 Max. :72.75 Max. :69.54 Max. : NA
## NA's :4 NA's :2 NA's :5
## scaledAcademAchiev affinityStatus expectedFamContrib
## Min. :62.58 Some Affinity:1 Min. : 0.000
## 1st Qu.:63.03 No Affinity :4 1st Qu.: 9.144
## Median :63.93 Median : 18.287
## Mean :64.53 Mean : 39.429
## 3rd Qu.:65.69 3rd Qu.: 59.144
## Max. :67.40 Max. :100.000
## NA's :2
## totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. :40037 Min. : 0 Min. :0
## 1st Qu.:41170 1st Qu.: 0 1st Qu.:0
## Median :41293 Median : 0 Median :0
## Mean :41874 Mean :1129 Mean :0
## 3rd Qu.:43308 3rd Qu.: 0 3rd Qu.:0
## Max. :43560 Max. :5645 Max. :0
##
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid:0 Did not received other aid:4
## Received WVU aid :5 Received other aid :1
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:5
## Is Promise :0
##
##
##
##
##
#AL2
finDataTableWVU_AL2 <- subset(finDataTableWVU, totalAwardWVU > 20000 & totalAwardWVU <= 40000)
summary(finDataTableWVU_AL2)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0 Min. : 0 Min. : 0
## 1st Qu.: 0 1st Qu.: 0 1st Qu.: 0 1st Qu.:10846
## Median : 0 Median : 0 Median : 0 Median :26770
## Mean : 4030 Mean : 1712 Mean : 1170 Mean :22643
## 3rd Qu.: 7562 3rd Qu.: 170 3rd Qu.: 3000 3rd Qu.:35444
## Max. :21336 Max. :17233 Max. :11938 Max. :39812
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:39 White :23
## 1st Qu.: 0.0 M:38 Black :14
## Median : 0.0 Hispanic: 0
## Mean : 458.9 Asian : 2
## 3rd Qu.: 0.0 Native : 1
## Max. :9338.0 Unknown :37
##
## degreeF degreeType
## Bachelor of Arts :32 Bachelor Degree :77
## Bachelor of Science :30 Regent Degree : 0
## BS in Business Administration: 5 Degree Not Declared : 0
## Bachelor of Fine Arts : 2 Associate Arts : 0
## BS in Aerospace Engineering : 2 Associate Applied Sci: 0
## BS in Journalism : 2
## (Other) : 4
## studentLoc stateIndicator proxStudentType
## WV :35 Out-of-State:42 Res or Out-of-State:43
## PA : 7 In-State :35 Long Commute : 0
## GA : 5 Short Commute :34
## TX : 4
## MD : 3
## FL : 2
## (Other):21
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 21.98 Min. : 51.24 Min. :23.71 Min. :23.85
## 1st Qu.: 62.34 1st Qu.: 69.19 1st Qu.:41.87 1st Qu.:43.94
## Median : 73.10 Median : 86.02 Median :56.40 Median :55.15
## Mean : 72.42 Mean : 82.17 Mean :56.33 Mean :56.11
## 3rd Qu.: 88.57 3rd Qu.: 96.53 3rd Qu.:67.76 3rd Qu.:67.85
## Max. :100.00 Max. :100.00 Max. :84.56 Max. :95.77
## NA's :1 NA's :31 NA's :26 NA's :9
## scoreGED scaledAcademAchiev affinityStatus
## Min. :72.28 Min. :31.59 Some Affinity:30
## 1st Qu.:72.28 1st Qu.:57.53 No Affinity :47
## Median :72.28 Median :67.04
## Mean :72.28 Mean :65.54
## 3rd Qu.:72.28 3rd Qu.:75.57
## Max. :72.28 Max. :87.51
## NA's :76
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. :20191 Min. : 0 Min. :0
## 1st Qu.: 0.000 1st Qu.:23520 1st Qu.: 0 1st Qu.:0
## Median : 2.321 Median :30346 Median : 0 Median :0
## Mean : 12.848 Mean :30014 Mean : 2388 Mean :0
## 3rd Qu.: 17.799 3rd Qu.:36555 3rd Qu.: 5444 3rd Qu.:0
## Max. :100.000 Max. :39812 Max. :11339 Max. :0
## NA's :11
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid:45
## Received WVU aid :77 Received other aid :32
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:77
## Is Promise : 0
##
##
##
##
##
#AL3
finDataTableWVU_AL3 <- subset(finDataTableWVU, totalAwardWVU > 10000 & totalAwardWVU <= 20000)
summary(finDataTableWVU_AL3)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0 Min. : 0 Min. : 0
## 1st Qu.: 800 1st Qu.: 0 1st Qu.: 0 1st Qu.: 0
## Median : 8336 Median : 0 Median : 0 Median : 0
## Mean : 7239 Mean : 2358 Mean : 1799 Mean : 1425
## 3rd Qu.:12500 3rd Qu.: 2040 3rd Qu.: 3000 3rd Qu.: 0
## Max. :18000 Max. :14982 Max. :15603 Max. :19771
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:116 White : 75
## 1st Qu.: 0.0 M:140 Black : 21
## Median : 0.0 Hispanic: 4
## Mean : 744.4 Asian : 3
## 3rd Qu.: 0.0 Native : 1
## Max. :9338.0 Unknown :151
## NA's : 1
## degreeF degreeType
## Bachelor of Science :108 Bachelor Degree :251
## Bachelor of Arts : 54 Regent Degree : 0
## BS in Business Administration: 21 Degree Not Declared : 0
## BS in Mechanical Engineering : 10 Associate Arts : 5
## Bachelor of Music : 8 Associate Applied Sci: 0
## BS in Chemical Engineering : 6
## (Other) : 49
## studentLoc stateIndicator proxStudentType
## WV :72 Out-of-State:184 Res or Out-of-State:209
## PA :47 In-State : 72 Long Commute : 3
## MD :35 Short Commute : 44
## VA :21
## OH :17
## FR : 8
## (Other):56
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 14.18 Min. : 31.94 Min. :19.17 Min. :11.15
## 1st Qu.: 73.10 1st Qu.: 75.25 1st Qu.:50.95 1st Qu.:51.77
## Median : 79.49 Median : 86.76 Median :61.85 Median :65.31
## Mean : 79.49 Mean : 84.34 Mean :62.66 Mean :63.98
## 3rd Qu.: 91.63 3rd Qu.: 96.91 3rd Qu.:79.11 3rd Qu.:77.15
## Max. :100.00 Max. :100.00 Max. :99.09 Max. :95.77
## NA's :5 NA's :92 NA's :72 NA's :32
## scoreGED scaledAcademAchiev affinityStatus
## Min. :72.28 Min. :23.03 Some Affinity:109
## 1st Qu.:78.22 1st Qu.:66.62 No Affinity :147
## Median :80.86 Median :72.78
## Mean :79.54 Mean :72.43
## 3rd Qu.:82.18 3rd Qu.:79.80
## Max. :84.16 Max. :95.78
## NA's :252
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. :10005 Min. : 0 Min. : 0.0
## 1st Qu.: 3.469 1st Qu.:11697 1st Qu.: 0 1st Qu.: 0.0
## Median : 12.600 Median :12902 Median : 4750 Median : 0.0
## Mean : 18.589 Mean :13565 Mean : 5869 Mean : 610.6
## 3rd Qu.: 25.107 3rd Qu.:15500 3rd Qu.:10274 3rd Qu.: 0.0
## Max. :100.000 Max. :20000 Max. :22603 Max. :4750.0
## NA's :21
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid: 93
## Received WVU aid :256 Received other aid :163
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:223
## Is Promise : 33
##
##
##
##
##
#AL4
finDataTableWVU_AL4 <- subset(finDataTableWVU, totalAwardWVU > 5000 & totalAwardWVU <= 10000)
summary(finDataTableWVU_AL4)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0 1st Qu.: 0.0
## Median : 4000 Median : 0.0 Median : 0 Median : 0.0
## Mean : 3705 Mean : 612.7 Mean :1439 Mean : 333.3
## 3rd Qu.: 6000 3rd Qu.: 0.0 3rd Qu.:3000 3rd Qu.: 0.0
## Max. :10000 Max. :9258.0 Max. :9600 Max. :9088.0
##
## instGrantOther studentGender studentEthn
## Min. : 0 F:281 White :209
## 1st Qu.: 0 M:346 Black : 31
## Median : 0 Hispanic: 3
## Mean :1045 Asian : 8
## 3rd Qu.:2000 Native : 0
## Max. :7392 Unknown :372
## NA's : 4
## degreeF degreeType
## Bachelor of Science :300 Bachelor Degree :599
## Bachelor of Arts :127 Regent Degree : 0
## BS in Business Administration: 55 Degree Not Declared : 6
## Associate of Arts : 20 Associate Arts : 20
## BS in Journalism : 20 Associate Applied Sci: 2
## Bachelor of Music : 14
## (Other) : 91
## studentLoc stateIndicator proxStudentType
## WV :223 Out-of-State:404 Res or Out-of-State:494
## PA :118 In-State :223 Long Commute : 15
## MD : 57 Short Commute :118
## VA : 50
## NJ : 37
## OH : 27
## (Other):115
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 15.26 Min. : 1.00 Min. : 10.99 Min. :19.62
## 1st Qu.: 69.26 1st Qu.: 75.00 1st Qu.: 50.95 1st Qu.:51.77
## Median : 76.60 Median : 86.64 Median : 62.76 Median :60.23
## Mean : 76.34 Mean : 83.81 Mean : 62.22 Mean :59.29
## 3rd Qu.: 87.56 3rd Qu.: 96.29 3rd Qu.: 73.66 3rd Qu.:68.69
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :94.92
## NA's :19 NA's :264 NA's :141 NA's :87
## scoreGED scaledAcademAchiev affinityStatus
## Min. :63.04 Min. :29.35 Some Affinity:243
## 1st Qu.:69.64 1st Qu.:63.29 No Affinity :384
## Median :73.60 Median :70.57
## Mean :76.14 Mean :69.42
## 3rd Qu.:80.20 3rd Qu.:76.47
## Max. :94.72 Max. :98.31
## NA's :614
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. : 5025 Min. : 0 Min. : 0
## 1st Qu.: 2.281 1st Qu.: 6000 1st Qu.: 653 1st Qu.: 0
## Median : 9.772 Median : 6903 Median : 6434 Median : 0
## Mean : 18.779 Mean : 7135 Mean : 8578 Mean : 922
## 3rd Qu.: 27.067 3rd Qu.: 8422 3rd Qu.:13458 3rd Qu.: 0
## Max. :100.000 Max. :10000 Max. :33239 Max. :4750
## NA's :14
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid:151
## Received WVU aid :627 Received other aid :476
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:505
## Is Promise :122
##
##
##
##
##
#AL5
finDataTableWVU_AL5 <- subset(finDataTableWVU, totalAwardWVU > 1000 & totalAwardWVU <= 5000)
summary(finDataTableWVU_AL5)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0 Min. : 0.00
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0 1st Qu.: 0.00
## Median : 0 Median : 0.0 Median : 0 Median : 0.00
## Mean :1420 Mean : 184.7 Mean :1060 Mean : 27.01
## 3rd Qu.:3000 3rd Qu.: 0.0 3rd Qu.:2000 3rd Qu.: 0.00
## Max. :5000 Max. :4996.0 Max. :5000 Max. :4866.00
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:1111 White : 913
## 1st Qu.: 0.0 M:1390 Black : 79
## Median : 0.0 Hispanic: 21
## Mean : 244.9 Asian : 28
## 3rd Qu.: 0.0 Native : 4
## Max. :5000.0 Unknown :1446
## NA's : 10
## degreeF degreeType
## Bachelor of Science :1133 Bachelor Degree :2329
## Bachelor of Arts : 578 Regent Degree : 0
## BS in Business Administration: 241 Degree Not Declared : 22
## Associate of Arts : 142 Associate Arts : 142
## BS in Journalism : 71 Associate Applied Sci: 8
## Bachelor of Music : 36
## (Other) : 300
## studentLoc stateIndicator proxStudentType
## WV :1327 Out-of-State:1174 Res or Out-of-State:1970
## PA : 327 In-State :1327 Long Commute : 62
## MD : 214 Short Commute : 469
## VA : 169
## NJ : 136
## OH : 106
## (Other): 222
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 8.264 Min. : 1.00 Min. :11.90 Min. : 1.00
## 1st Qu.: 69.062 1st Qu.: 75.25 1st Qu.:50.95 1st Qu.: 50.92
## Median : 78.142 Median : 87.13 Median :59.13 Median : 56.00
## Mean : 77.291 Mean : 83.91 Mean :59.25 Mean : 55.95
## 3rd Qu.: 88.903 3rd Qu.: 96.53 3rd Qu.:67.30 3rd Qu.: 62.77
## Max. :100.000 Max. :100.00 Max. :97.28 Max. :100.00
## NA's :39 NA's :973 NA's :493 NA's :435
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 61.72 Min. : 23.36 Some Affinity:1107
## 1st Qu.: 67.99 1st Qu.: 62.47 No Affinity :1394
## Median : 77.56 Median : 69.09
## Mean : 78.31 Mean : 68.55
## 3rd Qu.: 86.47 3rd Qu.: 75.07
## Max. :100.00 Max. :100.00
## NA's :2471
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. :1004 Min. : 0 Min. : 0
## 1st Qu.: 3.889 1st Qu.:2000 1st Qu.: 2420 1st Qu.: 0
## Median : 14.668 Median :3000 Median : 5880 Median : 0
## Mean : 22.274 Mean :2937 Mean : 8504 Mean :1777
## 3rd Qu.: 31.640 3rd Qu.:4000 3rd Qu.:13245 3rd Qu.:4750
## Max. :100.000 Max. :5000 Max. :42328 Max. :7125
## NA's :73
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid: 548
## Received WVU aid :2501 Received other aid :1953
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:1541
## Is Promise : 960
##
##
##
##
##
#AL6
finDataTableWVU_AL6 <- subset(finDataTableWVU, totalAwardWVU > 500 & totalAwardWVU <= 1000)
summary(finDataTableWVU_AL6)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0.0 Min. : 0.00 Min. : 0 Min. : 0.00
## 1st Qu.: 0.0 1st Qu.: 0.00 1st Qu.: 0 1st Qu.: 0.00
## Median : 0.0 Median : 0.00 Median : 800 Median : 0.00
## Mean : 183.2 Mean : 54.13 Mean : 551 Mean : 3.46
## 3rd Qu.: 0.0 3rd Qu.: 0.00 3rd Qu.:1000 3rd Qu.: 0.00
## Max. :1000.0 Max. :959.00 Max. :1000 Max. :1000.00
##
## instGrantOther studentGender studentEthn
## Min. : 0 F:342 White :266
## 1st Qu.: 0 M:236 Black : 16
## Median : 0 Hispanic: 3
## Mean : 153 Asian : 3
## 3rd Qu.: 0 Native : 2
## Max. :1000 Unknown :286
## NA's : 2
## degreeF degreeType
## Bachelor of Science :216 Bachelor Degree :453
## Bachelor of Arts :117 Regent Degree : 0
## Associate of Arts : 99 Degree Not Declared : 14
## BS in Business Administration: 41 Associate Arts : 99
## BS in Journalism : 17 Associate Applied Sci: 12
## Degree Not Declared : 14
## (Other) : 74
## studentLoc stateIndicator proxStudentType
## WV :421 Out-of-State:157 Res or Out-of-State:460
## MD : 39 In-State :421 Long Commute : 28
## VA : 39 Short Commute : 90
## OH : 24
## PA : 21
## NY : 8
## (Other): 26
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 31.40 Min. : 32.19 Min. :15.53 Min. :12.85
## 1st Qu.: 70.41 1st Qu.: 75.25 1st Qu.:47.32 1st Qu.:42.46
## Median : 81.50 Median : 86.14 Median :51.86 Median :50.08
## Mean : 78.58 Mean : 83.27 Mean :51.89 Mean :50.45
## 3rd Qu.: 90.50 3rd Qu.: 94.31 3rd Qu.:55.50 3rd Qu.:56.85
## Max. :100.00 Max. :100.00 Max. :85.47 Max. :89.85
## NA's :12 NA's :197 NA's :106 NA's :136
## scoreGED scaledAcademAchiev affinityStatus
## Min. :73.60 Min. : 31.40 Some Affinity:252
## 1st Qu.:75.58 1st Qu.: 60.61 No Affinity :326
## Median :76.90 Median : 66.90
## Mean :78.06 Mean : 66.05
## 3rd Qu.:80.86 3rd Qu.: 72.36
## Max. :84.16 Max. :100.00
## NA's :570
## expectedFamContrib totalAwardWVU totalAwardnonWVU
## Min. : 0.000 Min. : 504.0 Min. : 0
## 1st Qu.: 1.358 1st Qu.:1000.0 1st Qu.: 4750
## Median : 7.347 Median :1000.0 Median : 8995
## Mean : 16.065 Mean : 944.7 Mean : 9562
## 3rd Qu.: 22.922 3rd Qu.:1000.0 3rd Qu.:13839
## Max. :100.000 Max. :1000.0 Max. :40333
## NA's :6
## totalAwardPromScholar aidStudentWVU
## Min. : 0 Did not received WVU aid: 0
## 1st Qu.: 0 Received WVU aid :578
## Median : 0
## Mean :1860
## 3rd Qu.:4750
## Max. :6980
##
## aidStudentnonWVU aidStudentPromScholar
## Did not received other aid: 59 Is not Promise:335
## Received other aid :519 Is Promise :243
##
##
##
##
##
#AL7
finDataTableWVU_AL7 <- subset(finDataTableWVU, totalAwardWVU > 100 & totalAwardWVU <= 500)
summary(finDataTableWVU_AL7)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0.00 Min. : 0.00 Min. : 0.0 Min. : 0.000
## 1st Qu.: 0.00 1st Qu.: 0.00 1st Qu.: 0.0 1st Qu.: 0.000
## Median : 0.00 Median : 0.00 Median :400.0 Median : 0.000
## Mean : 48.24 Mean : 37.57 Mean :268.5 Mean : 1.173
## 3rd Qu.: 0.00 3rd Qu.: 0.00 3rd Qu.:500.0 3rd Qu.: 0.000
## Max. :500.00 Max. :498.00 Max. :500.0 Max. :400.000
##
## instGrantOther studentGender studentEthn
## Min. : 0.00 F:174 White :147
## 1st Qu.: 0.00 M:167 Black : 7
## Median : 0.00 Hispanic: 0
## Mean : 91.39 Asian : 7
## 3rd Qu.: 0.00 Native : 0
## Max. :500.00 Unknown :178
## NA's : 2
## degreeF degreeType
## Bachelor of Science :131 Bachelor Degree :296
## Bachelor of Arts : 78 Regent Degree : 1
## Associate of Arts : 34 Degree Not Declared : 8
## BS in Business Administration : 31 Associate Arts : 34
## Bachelor of Multidisc. Studies: 16 Associate Applied Sci: 2
## BS in Journalism : 10
## (Other) : 41
## studentLoc stateIndicator proxStudentType
## WV :239 Out-of-State:102 Res or Out-of-State:256
## MD : 27 In-State :239 Long Commute : 16
## PA : 18 Short Commute : 69
## VA : 14
## NJ : 11
## OH : 11
## (Other): 21
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 18.62 Min. : 41.59 Min. :20.98 Min. :12.85
## 1st Qu.: 69.06 1st Qu.: 76.24 1st Qu.:45.50 1st Qu.:44.15
## Median : 80.50 Median : 87.13 Median :52.77 Median :50.08
## Mean : 77.30 Mean : 84.20 Mean :52.87 Mean :51.23
## 3rd Qu.: 88.65 3rd Qu.: 95.79 3rd Qu.:59.13 3rd Qu.:58.54
## Max. :100.00 Max. :100.00 Max. :91.83 Max. :89.00
## NA's :5 NA's :96 NA's :52 NA's :85
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 69.64 Min. :35.94 Some Affinity:193
## 1st Qu.: 73.60 1st Qu.:60.56 No Affinity :148
## Median : 82.84 Median :67.03
## Mean : 82.69 Mean :66.57
## 3rd Qu.: 89.44 3rd Qu.:73.54
## Max. :100.00 Max. :97.15
## NA's :332
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. :130.0 Min. : 0 Min. : 0
## 1st Qu.: 1.368 1st Qu.:427.0 1st Qu.: 4701 1st Qu.: 0
## Median : 6.792 Median :500.0 Median : 6850 Median : 0
## Mean : 15.298 Mean :446.9 Mean : 8613 Mean :1717
## 3rd Qu.: 18.677 3rd Qu.:500.0 3rd Qu.:12963 3rd Qu.:4750
## Max. :100.000 Max. :500.0 Max. :41917 Max. :4750
## NA's :8
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid: 39
## Received WVU aid :341 Received other aid :302
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:204
## Is Promise :137
##
##
##
##
##
#AL8
finDataTableWVU_AL8 <- subset(finDataTableWVU, totalAwardWVU > 0 & totalAwardWVU <= 100)
summary(finDataTableWVU_AL8)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. :0 Min. : 0.00 Min. : 0.00 Min. :0
## 1st Qu.:0 1st Qu.: 0.00 1st Qu.: 0.00 1st Qu.:0
## Median :0 Median : 40.00 Median : 0.00 Median :0
## Mean :0 Mean : 36.82 Mean : 23.27 Mean :0
## 3rd Qu.:0 3rd Qu.: 58.00 3rd Qu.: 28.00 3rd Qu.:0
## Max. :0 Max. :100.00 Max. :100.00 Max. :0
##
## instGrantOther studentGender studentEthn
## Min. : 0.000 F:4 White :4
## 1st Qu.: 0.000 M:7 Black :1
## Median : 0.000 Hispanic:0
## Mean : 9.091 Asian :0
## 3rd Qu.: 0.000 Native :0
## Max. :100.000 Unknown :6
##
## degreeF degreeType studentLoc
## Bachelor of Science :4 Bachelor Degree :8 NJ :3
## Bachelor of Arts :3 Regent Degree :0 WV :3
## Associate of Arts :2 Degree Not Declared :0 PA :2
## Associate of Applied Sci :1 Associate Arts :2 MD :1
## BS in Business Administration:1 Associate Applied Sci:1 OH :1
## Bachelor Electronic Engr :0 VA :1
## (Other) :0 (Other):0
## stateIndicator proxStudentType highSchoolGPA
## Out-of-State:8 Res or Out-of-State:11 Min. :32.74
## In-State :3 Long Commute : 0 1st Qu.:45.56
## Short Commute : 0 Median :65.03
## Mean :64.57
## 3rd Qu.:80.50
## Max. :96.64
##
## prevColGPA highestACT totalSAT scoreGED
## Min. : 57.92 Min. :38.24 Min. :33.15 Min. : NA
## 1st Qu.: 85.64 1st Qu.:45.50 1st Qu.:45.85 1st Qu.: NA
## Median : 92.08 Median :54.59 Median :50.08 Median : NA
## Mean : 87.13 Mean :53.78 Mean :51.68 Mean :NaN
## 3rd Qu.:100.00 3rd Qu.:58.22 3rd Qu.:56.00 3rd Qu.: NA
## Max. :100.00 Max. :75.48 Max. :77.15 Max. : NA
## NA's :6 NA's :2 NA's :2 NA's :11
## scaledAcademAchiev affinityStatus expectedFamContrib
## Min. :44.75 Some Affinity:4 Min. : 0.009
## 1st Qu.:55.71 No Affinity :7 1st Qu.: 1.610
## Median :60.66 Median : 5.753
## Mean :62.10 Mean :11.133
## 3rd Qu.:68.76 3rd Qu.: 9.827
## Max. :81.35 Max. :39.594
## NA's :1
## totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 25.00 Min. : 0 Min. : 0.0
## 1st Qu.: 57.00 1st Qu.: 4264 1st Qu.: 0.0
## Median : 58.00 Median : 9339 Median : 0.0
## Mean : 69.18 Mean : 9915 Mean : 735.1
## 3rd Qu.:100.00 3rd Qu.:16966 3rd Qu.: 0.0
## Max. :100.00 Max. :19740 Max. :4750.0
##
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid:3
## Received WVU aid :11 Received other aid :8
##
##
##
##
##
## aidStudentPromScholar
## Is not Promise:9
## Is Promise :2
##
##
##
##
##
#Descriptive stats
#create a function to summarize mean of the data
summaryTable <- function(a = NULL, table1 = NULL, list1 = list(studentGender), func = mean) {
table1 <- tapply(a, list1, func)
print(table1)
}
#Student attributes
#studentGender, studentEthn, degreeF, degreeType, studentLoc, stateIndicator, proxStudentType
for(i in 13:15){
print(colnames(finDataTableWVU[i]))
summaryTable(finDataTableWVU[,i], list1, func = mean)
writeLines("")
}
## [1] "highSchoolGPA"
## F M
## NA NA
##
## [1] "prevColGPA"
## F M
## NA NA
##
## [1] "highestACT"
## F M
## NA NA
names(finDataTableWVU)
## [1] "rule49Grant" "instEmployAid"
## [3] "instGrantAcademic" "instGrantAthletic"
## [5] "instGrantOther" "studentGender"
## [7] "studentEthn" "degreeF"
## [9] "degreeType" "studentLoc"
## [11] "stateIndicator" "proxStudentType"
## [13] "highSchoolGPA" "prevColGPA"
## [15] "highestACT" "totalSAT"
## [17] "scoreGED" "scaledAcademAchiev"
## [19] "affinityStatus" "expectedFamContrib"
## [21] "totalAwardWVU" "totalAwardnonWVU"
## [23] "totalAwardPromScholar" "aidStudentWVU"
## [25] "aidStudentnonWVU" "aidStudentPromScholar"
summary(finDataTableWVU)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0.0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0.0 1st Qu.: 0.0
## Median : 0 Median : 0.0 Median : 0.0 Median : 0.0
## Mean : 950 Mean : 189.3 Mean : 526.6 Mean : 301.2
## 3rd Qu.: 0 3rd Qu.: 0.0 3rd Qu.: 0.0 3rd Qu.: 0.0
## Max. :21336 Max. :17233.0 Max. :15603.0 Max. :41170.0
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:3922 White :3435
## 1st Qu.: 0.0 M:4668 Black : 446
## Median : 0.0 Hispanic: 79
## Mean : 187.8 Asian : 106
## 3rd Qu.: 0.0 Native : 16
## Max. :9338.0 Unknown :4464
## NA's : 44
## degreeF degreeType
## Bachelor of Science :3430 Bachelor Degree :7531
## Bachelor of Arts :2040 Regent Degree : 3
## Associate of Arts : 847 Degree Not Declared : 111
## BS in Business Administration : 797 Associate Arts : 847
## BS in Journalism : 238 Associate Applied Sci: 98
## Bachelor of Multidisc. Studies: 150
## (Other) :1088
## studentLoc stateIndicator proxStudentType
## WV :4341 Out-of-State:4249 Res or Out-of-State:6834
## PA : 935 In-State :4341 Long Commute : 227
## MD : 778 Short Commute :1529
## VA : 673
## NJ : 473
## OH : 302
## (Other):1088
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 1.00 Min. : 1.00 Min. : 1.00 Min. : 1.00
## 1st Qu.: 58.97 1st Qu.: 73.27 1st Qu.: 45.50 1st Qu.: 45.00
## Median : 73.43 Median : 85.64 Median : 54.59 Median : 52.62
## Mean : 71.21 Mean : 82.45 Mean : 55.49 Mean : 53.08
## 3rd Qu.: 84.87 3rd Qu.: 95.79 3rd Qu.: 64.58 3rd Qu.: 60.23
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
## NA's :145 NA's :3510 NA's :2074 NA's :1793
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 1.00 Min. : 13.60 Some Affinity:3718
## 1st Qu.: 68.32 1st Qu.: 57.17 No Affinity :4872
## Median : 73.60 Median : 65.44
## Mean : 74.18 Mean : 64.69
## 3rd Qu.: 81.52 3rd Qu.: 72.64
## Max. :100.00 Max. :100.00
## NA's :8425 NA's :1
## expectedFamContrib totalAwardWVU totalAwardnonWVU
## Min. : 0.000 Min. : 0.0 Min. : 0
## 1st Qu.: 1.351 1st Qu.: 0.0 1st Qu.: 0
## Median : 9.965 Median : 447.5 Median : 5444
## Mean : 18.078 Mean : 2154.9 Mean : 7746
## 3rd Qu.: 25.156 3rd Qu.: 3000.0 3rd Qu.:12645
## Max. :100.000 Max. :43560.0 Max. :44595
## NA's :436
## totalAwardPromScholar aidStudentWVU
## Min. : 0.0 Did not received WVU aid:4194
## 1st Qu.: 0.0 Received WVU aid :4396
## Median : 0.0
## Mean : 874.1
## 3rd Qu.: 0.0
## Max. :7125.0
##
## aidStudentnonWVU aidStudentPromScholar
## Did not received other aid:2756 Is not Promise:6945
## Received other aid :5834 Is Promise :1645
##
##
##
##
##
Now deal with the blank values and NA’s on variables within the finDataTableWVU dataset so that we can model these without excluding too many.
finDataTableWVU$highSchoolGPA.NA <- is.na(finDataTableWVU$highSchoolGPA)
finDataTableWVU$prevColGPA.NA <- is.na(finDataTableWVU$prevColGPA)
finDataTableWVU$highestACT.NA <- is.na(finDataTableWVU$highestACT)
finDataTableWVU$totalSAT.NA <- is.na(finDataTableWVU$totalSAT)
finDataTableWVU$scoreGED.NA <- is.na(finDataTableWVU$scoreGED)
finDataTableWVU$expectedFamContrib.NA <- is.na(finDataTableWVU$expectedFamContrib)
finDataTableWVU$studentEthn.NA <-is.na(finDataTableWVU$studentEthn)
finDataTableWVU$scaledAcademAchiev.NA <-is.na(finDataTableWVU$scaledAcademAchiev)
finDataTableWVU$highSchoolGPA[is.na(finDataTableWVU$highSchoolGPA)] = 1
finDataTableWVU$prevColGPA[is.na(finDataTableWVU$prevColGPA)] = 1
finDataTableWVU$highestACT[is.na(finDataTableWVU$highestACT)] = 1
finDataTableWVU$totalSAT[is.na(finDataTableWVU$totalSAT)] = 1
finDataTableWVU$scoreGED[is.na(finDataTableWVU$scoreGED)] = 1
finDataTableWVU$expectedFamContrib[is.na(finDataTableWVU$expectedFamContrib)] = 1
finDataTableWVU$studentEthn[is.na(finDataTableWVU$studentEthn)] = "Unknown"
finDataTableWVU$scaledAcademAchiev[is.na(finDataTableWVU$scaledAcademAchiev)] = 1
summary(finDataTableWVU)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0.0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0.0 1st Qu.: 0.0
## Median : 0 Median : 0.0 Median : 0.0 Median : 0.0
## Mean : 950 Mean : 189.3 Mean : 526.6 Mean : 301.2
## 3rd Qu.: 0 3rd Qu.: 0.0 3rd Qu.: 0.0 3rd Qu.: 0.0
## Max. :21336 Max. :17233.0 Max. :15603.0 Max. :41170.0
##
## instGrantOther studentGender studentEthn
## Min. : 0.0 F:3922 White :3435
## 1st Qu.: 0.0 M:4668 Black : 446
## Median : 0.0 Hispanic: 79
## Mean : 187.8 Asian : 106
## 3rd Qu.: 0.0 Native : 16
## Max. :9338.0 Unknown :4508
##
## degreeF degreeType
## Bachelor of Science :3430 Bachelor Degree :7531
## Bachelor of Arts :2040 Regent Degree : 3
## Associate of Arts : 847 Degree Not Declared : 111
## BS in Business Administration : 797 Associate Arts : 847
## BS in Journalism : 238 Associate Applied Sci: 98
## Bachelor of Multidisc. Studies: 150
## (Other) :1088
## studentLoc stateIndicator proxStudentType
## WV :4341 Out-of-State:4249 Res or Out-of-State:6834
## PA : 935 In-State :4341 Long Commute : 227
## MD : 778 Short Commute :1529
## VA : 673
## NJ : 473
## OH : 302
## (Other):1088
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 1.00 Min. : 1.00 Min. : 1.00 Min. : 1.00
## 1st Qu.: 58.03 1st Qu.: 1.00 1st Qu.: 24.61 1st Qu.: 34.00
## Median : 73.10 Median : 65.84 Median : 50.05 Median : 49.23
## Mean : 70.03 Mean : 49.17 Mean : 42.34 Mean : 42.21
## 3rd Qu.: 84.53 3rd Qu.: 88.86 3rd Qu.: 60.94 3rd Qu.: 58.54
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
##
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 1.000 Min. : 1.00 Some Affinity:3718
## 1st Qu.: 1.000 1st Qu.: 57.16 No Affinity :4872
## Median : 1.000 Median : 65.43
## Mean : 2.406 Mean : 64.68
## 3rd Qu.: 1.000 3rd Qu.: 72.64
## Max. :100.000 Max. :100.00
##
## expectedFamContrib totalAwardWVU totalAwardnonWVU
## Min. : 0.000 Min. : 0.0 Min. : 0
## 1st Qu.: 1.000 1st Qu.: 0.0 1st Qu.: 0
## Median : 8.654 Median : 447.5 Median : 5444
## Mean : 17.211 Mean : 2154.9 Mean : 7746
## 3rd Qu.: 24.163 3rd Qu.: 3000.0 3rd Qu.:12645
## Max. :100.000 Max. :43560.0 Max. :44595
##
## totalAwardPromScholar aidStudentWVU
## Min. : 0.0 Did not received WVU aid:4194
## 1st Qu.: 0.0 Received WVU aid :4396
## Median : 0.0
## Mean : 874.1
## 3rd Qu.: 0.0
## Max. :7125.0
##
## aidStudentnonWVU aidStudentPromScholar
## Did not received other aid:2756 Is not Promise:6945
## Received other aid :5834 Is Promise :1645
##
##
##
##
##
## highSchoolGPA.NA prevColGPA.NA highestACT.NA totalSAT.NA
## Mode :logical Mode :logical Mode :logical Mode :logical
## FALSE:8445 FALSE:5080 FALSE:6516 FALSE:6797
## TRUE :145 TRUE :3510 TRUE :2074 TRUE :1793
## NA's :0 NA's :0 NA's :0 NA's :0
##
##
##
## scoreGED.NA expectedFamContrib.NA studentEthn.NA
## Mode :logical Mode :logical Mode :logical
## FALSE:165 FALSE:8154 FALSE:8546
## TRUE :8425 TRUE :436 TRUE :44
## NA's :0 NA's :0 NA's :0
##
##
##
## scaledAcademAchiev.NA
## Mode :logical
## FALSE:8589
## TRUE :1
## NA's :0
##
##
##
#model transformation
#To avoid problems with negative values of the response variable, we add 0.5 to all observations
pred <- finDataTableWVU$totalAwardWVU + 0.5
modWVUAid <- lm(sqrt(pred) ~ studentGender + studentEthn + degreeF + proxStudentType + affinityStatus + expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU + aidStudentWVU + aidStudentPromScholar + affinityStatus + highestACT + highestACT.NA + totalSAT + totalSAT.NA + totalAwardnonWVU + totalAwardPromScholar, data = finDataTableWVU)
require(MASS)
## Loading required package: MASS
bc <- boxcox(modWVUAid)
#The optimal transformation has a parameter close to -2
#find the approximate mle as the x-value that yields the maximum
bc$x[bc$y==max(bc$y)]
## [1] -2
#call the function with a single parameter value to just evaluate the log-likelihood
bc0 <- boxcox(modWVUAid, lambda = 1, plotit = TRUE)
bc1 <- boxcox(modWVUAid, lambda = 0, plotit = TRUE)
bc2 <- boxcox(modWVUAid, lambda = 2, plotit = TRUE)
bc3 <- boxcox(modWVUAid, lambda = -1, plotit = TRUE)
bc4 <- boxcox(modWVUAid, lambda = -2, plotit = TRUE)
TukeyHSD(aov(modWVUAid), ordered = TRUE, conf.level = 0.99, "proxStudentType")
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## expectedFamContrib
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## expectedFamContrib.NA
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## highestACT
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## highestACT.NA
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## totalSAT
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## totalSAT.NA
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## totalAwardnonWVU
## Warning in replications(paste("~", xx), data = mf): non-factors ignored:
## totalAwardPromScholar
## Tukey multiple comparisons of means
## 99% family-wise confidence level
## factor levels have been ordered
##
## Fit: aov(formula = modWVUAid)
##
## $proxStudentType
## diff lwr upr p adj
## Res or Out-of-State-Long Commute 3.392833 -0.4377316 7.223397 0.0266593
## Short Commute-Long Commute 5.384912 1.3463602 9.423464 0.0003026
## Short Commute-Res or Out-of-State 1.992079 0.3858042 3.598354 0.0008842
summary(modWVUAid)
##
## Call:
## lm(formula = sqrt(pred) ~ studentGender + studentEthn + degreeF +
## proxStudentType + affinityStatus + expectedFamContrib + expectedFamContrib.NA +
## aidStudentnonWVU + aidStudentWVU + aidStudentPromScholar +
## affinityStatus + highestACT + highestACT.NA + totalSAT +
## totalSAT.NA + totalAwardnonWVU + totalAwardPromScholar, data = finDataTableWVU)
##
## Residuals:
## Min 1Q Median 3Q Max
## -58.876 -7.367 -1.087 4.828 143.313
##
## Coefficients:
## Estimate Std. Error t value
## (Intercept) -2.861e+01 2.429e+00 -11.780
## studentGenderM 1.914e-01 4.366e-01 0.438
## studentEthnBlack 8.897e+00 1.010e+00 8.810
## studentEthnHispanic 2.288e+00 2.223e+00 1.030
## studentEthnAsian 4.584e-01 1.936e+00 0.237
## studentEthnNative 4.875e+00 4.893e+00 0.996
## studentEthnUnknown 1.129e+00 4.583e-01 2.463
## degreeFAssociate of Arts 8.974e-01 2.086e+00 0.430
## degreeFBachelor Electronic Engr 8.001e+00 1.393e+01 0.575
## degreeFBachelor Engr Tech 2.263e+01 9.946e+00 2.275
## degreeFBachelor of Arts 6.042e+00 2.048e+00 2.950
## degreeFBachelor of Fine Arts 3.206e+00 2.716e+00 1.180
## degreeFBachelor of Multidisc. Studies 2.543e+00 2.562e+00 0.993
## degreeFBachelor of Music 1.446e+01 2.957e+00 4.890
## degreeFBachelor of Science 5.517e+00 2.032e+00 2.715
## degreeFBachelor of Science in Nursing 3.497e+00 5.759e+00 0.607
## degreeFBachelor of Social Work 3.321e+00 3.618e+00 0.918
## degreeFBS in Aerospace Engineering 9.394e+00 3.196e+00 2.939
## degreeFBS in Agriculture 1.374e+00 3.249e+00 0.423
## degreeFBS in Biometric Systems 4.005e+00 6.221e+00 0.644
## degreeFBS in Business Administration 4.875e+00 2.122e+00 2.297
## degreeFBS in Chemical Engineering 1.327e+01 3.389e+00 3.916
## degreeFBS in Civil Engineering 8.499e+00 3.339e+00 2.545
## degreeFBS in Computer Engineering 3.883e+00 4.141e+00 0.938
## degreeFBS in Computer Science 1.158e+01 3.259e+00 3.554
## degreeFBS in Electrical Engineering 9.398e+00 3.552e+00 2.646
## degreeFBS in Forestry 2.593e+00 3.673e+00 0.706
## degreeFBS in Industrial Engineering 1.195e+01 3.780e+00 3.162
## degreeFBS in Journalism 5.210e+00 2.374e+00 2.195
## degreeFBS in Landscape Architecture 4.541e+00 4.260e+00 1.066
## degreeFBS in Mechanical Engineering 1.324e+01 3.172e+00 4.173
## degreeFBS in Mining Engineering -4.911e+00 6.210e+00 -0.791
## degreeFBS in Petroleum & Natl Gas Eng 8.194e+00 3.621e+00 2.263
## degreeFBS in Physical Education 1.876e+01 5.131e+00 3.655
## degreeFBS in Recreation -1.652e+00 5.137e+00 -0.322
## degreeFDegree Not Declared 6.683e-01 2.710e+00 0.247
## degreeFRegents Bachelor of Arts -2.915e+00 1.143e+01 -0.255
## proxStudentTypeLong Commute -2.081e+00 1.330e+00 -1.564
## proxStudentTypeShort Commute 2.155e+00 5.707e-01 3.775
## affinityStatusNo Affinity 1.614e+00 4.346e-01 3.713
## expectedFamContrib -1.680e-02 9.906e-03 -1.696
## expectedFamContrib.NATRUE 1.877e+00 1.039e+00 1.806
## aidStudentnonWVUReceived other aid -4.953e-01 6.748e-01 -0.734
## aidStudentWVUReceived WVU aid 5.907e+01 4.775e-01 123.699
## aidStudentPromScholarIs Promise -3.396e+01 3.701e+00 -9.175
## highestACT 1.783e-01 1.810e-02 9.851
## highestACT.NATRUE 1.042e+01 1.088e+00 9.576
## totalSAT 2.819e-01 2.058e-02 13.699
## totalSAT.NATRUE 1.292e+01 1.190e+00 10.860
## totalAwardnonWVU -1.011e-04 3.493e-05 -2.895
## totalAwardPromScholar 4.542e-03 8.016e-04 5.667
## Pr(>|t|)
## (Intercept) < 2e-16 ***
## studentGenderM 0.661120
## studentEthnBlack < 2e-16 ***
## studentEthnHispanic 0.303271
## studentEthnAsian 0.812841
## studentEthnNative 0.319197
## studentEthnUnknown 0.013786 *
## degreeFAssociate of Arts 0.666998
## degreeFBachelor Electronic Engr 0.565586
## degreeFBachelor Engr Tech 0.022913 *
## degreeFBachelor of Arts 0.003190 **
## degreeFBachelor of Fine Arts 0.237926
## degreeFBachelor of Multidisc. Studies 0.320904
## degreeFBachelor of Music 1.03e-06 ***
## degreeFBachelor of Science 0.006634 **
## degreeFBachelor of Science in Nursing 0.543676
## degreeFBachelor of Social Work 0.358740
## degreeFBS in Aerospace Engineering 0.003298 **
## degreeFBS in Agriculture 0.672459
## degreeFBS in Biometric Systems 0.519706
## degreeFBS in Business Administration 0.021645 *
## degreeFBS in Chemical Engineering 9.08e-05 ***
## degreeFBS in Civil Engineering 0.010930 *
## degreeFBS in Computer Engineering 0.348469
## degreeFBS in Computer Science 0.000382 ***
## degreeFBS in Electrical Engineering 0.008166 **
## degreeFBS in Forestry 0.480322
## degreeFBS in Industrial Engineering 0.001572 **
## degreeFBS in Journalism 0.028182 *
## degreeFBS in Landscape Architecture 0.286439
## degreeFBS in Mechanical Engineering 3.03e-05 ***
## degreeFBS in Mining Engineering 0.429073
## degreeFBS in Petroleum & Natl Gas Eng 0.023682 *
## degreeFBS in Physical Education 0.000258 ***
## degreeFBS in Recreation 0.747826
## degreeFDegree Not Declared 0.805233
## degreeFRegents Bachelor of Arts 0.798610
## proxStudentTypeLong Commute 0.117868
## proxStudentTypeShort Commute 0.000161 ***
## affinityStatusNo Affinity 0.000206 ***
## expectedFamContrib 0.089898 .
## expectedFamContrib.NATRUE 0.071016 .
## aidStudentnonWVUReceived other aid 0.463029
## aidStudentWVUReceived WVU aid < 2e-16 ***
## aidStudentPromScholarIs Promise < 2e-16 ***
## highestACT < 2e-16 ***
## highestACT.NATRUE < 2e-16 ***
## totalSAT < 2e-16 ***
## totalSAT.NATRUE < 2e-16 ***
## totalAwardnonWVU 0.003796 **
## totalAwardPromScholar 1.50e-08 ***
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 19.48 on 8539 degrees of freedom
## Multiple R-squared: 0.6987, Adjusted R-squared: 0.697
## F-statistic: 396.1 on 50 and 8539 DF, p-value: < 2.2e-16
ncvTest(modWVUAid)
## Non-constant Variance Score Test
## Variance formula: ~ fitted.values
## Chisquare = 4194.659 Df = 1 p = 0
plot(modWVUAid)
mmp(modWVUAid)
summary.aov(modWVUAid)
## Df Sum Sq Mean Sq F value Pr(>F)
## studentGender 1 11 11 0.029 0.863919
## studentEthn 5 89740 17948 47.284 < 2e-16 ***
## degreeF 30 423187 14106 37.163 < 2e-16 ***
## proxStudentType 2 8225 4113 10.835 2.00e-05 ***
## affinityStatus 1 3232 3232 8.515 0.003532 **
## expectedFamContrib 1 33203 33203 87.473 < 2e-16 ***
## expectedFamContrib.NA 1 13185 13185 34.736 3.92e-09 ***
## aidStudentnonWVU 1 193383 193383 509.470 < 2e-16 ***
## aidStudentWVU 1 6470783 6470783 17047.363 < 2e-16 ***
## aidStudentPromScholar 1 134270 134270 353.736 < 2e-16 ***
## highestACT 1 4948 4948 13.034 0.000308 ***
## highestACT.NA 1 51116 51116 134.665 < 2e-16 ***
## totalSAT 1 29303 29303 77.199 < 2e-16 ***
## totalSAT.NA 1 47609 47609 125.427 < 2e-16 ***
## totalAwardnonWVU 1 2585 2585 6.809 0.009085 **
## totalAwardPromScholar 1 12189 12189 32.112 1.50e-08 ***
## Residuals 8539 3241206 380
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
plot(totalAwardWVU ~ modWVUAid$fitted.values)
#Other model approach:
totalAwardWVUMod3 <- lm(sqrt(totalAwardWVU) ~ studentGender + studentEthn + degreeF + degreeType + studentLoc + stateIndicator + proxStudentType + scaledAcademAchiev + affinityStatus + expectedFamContrib, data = finDataTableWVU)
summary(totalAwardWVUMod3)
##
## Call:
## lm(formula = sqrt(totalAwardWVU) ~ studentGender + studentEthn +
## degreeF + degreeType + studentLoc + stateIndicator + proxStudentType +
## scaledAcademAchiev + affinityStatus + expectedFamContrib,
## data = finDataTableWVU)
##
## Residuals:
## Min 1Q Median 3Q Max
## -103.217 -24.549 -5.017 19.719 187.986
##
## Coefficients: (5 not defined because of singularities)
## Estimate Std. Error t value
## (Intercept) -73.18893 33.04051 -2.215
## studentGenderM -0.07648 0.73554 -0.104
## studentEthnBlack 9.94979 1.76711 5.631
## studentEthnHispanic -0.26017 3.76653 -0.069
## studentEthnAsian 0.56880 3.24972 0.175
## studentEthnNative 9.10260 8.22911 1.106
## studentEthnUnknown 4.42730 0.77710 5.697
## degreeFAssociate of Arts 4.88580 3.49915 1.396
## degreeFBachelor Electronic Engr 2.30242 23.38293 0.098
## degreeFBachelor Engr Tech 40.50860 16.72631 2.422
## degreeFBachelor of Arts 8.13814 3.44674 2.361
## degreeFBachelor of Fine Arts 3.82727 4.57410 0.837
## degreeFBachelor of Multidisc. Studies 4.70740 4.30769 1.093
## degreeFBachelor of Music 29.44563 4.96853 5.926
## degreeFBachelor of Science 10.01735 3.42204 2.927
## degreeFBachelor of Science in Nursing 14.38266 9.67316 1.487
## degreeFBachelor of Social Work -1.93530 6.11300 -0.317
## degreeFBS in Aerospace Engineering 9.50975 5.38567 1.766
## degreeFBS in Agriculture 2.45791 5.46400 0.450
## degreeFBS in Biometric Systems 10.32416 10.44014 0.989
## degreeFBS in Business Administration 7.37477 3.57521 2.063
## degreeFBS in Chemical Engineering 12.42549 5.70203 2.179
## degreeFBS in Civil Engineering 23.81915 5.61094 4.245
## degreeFBS in Computer Engineering 12.12923 6.95250 1.745
## degreeFBS in Computer Science 24.93995 5.46371 4.565
## degreeFBS in Electrical Engineering 16.08203 5.97627 2.691
## degreeFBS in Forestry 4.44258 6.20946 0.715
## degreeFBS in Industrial Engineering 10.66108 6.36184 1.676
## degreeFBS in Journalism 8.29489 3.99769 2.075
## degreeFBS in Landscape Architecture 18.36802 7.17340 2.561
## degreeFBS in Mechanical Engineering 22.00283 5.35739 4.107
## degreeFBS in Mining Engineering 3.66000 10.48486 0.349
## degreeFBS in Petroleum & Natl Gas Eng 11.67234 6.12169 1.907
## degreeFBS in Physical Education 37.88957 8.70572 4.352
## degreeFBS in Recreation -10.29167 8.63223 -1.192
## degreeFDegree Not Declared 7.48866 4.55802 1.643
## degreeFRegents Bachelor of Arts 7.05486 19.18867 0.368
## degreeTypeRegent Degree NA NA NA
## degreeTypeDegree Not Declared NA NA NA
## degreeTypeAssociate Arts NA NA NA
## degreeTypeAssociate Applied Sci NA NA NA
## studentLocAK -6.96882 46.34705 -0.150
## studentLocAL 18.84469 35.46334 0.531
## studentLocAP 30.85610 46.36522 0.666
## studentLocAR 12.22545 36.67811 0.333
## studentLocAZ -1.56243 40.15331 -0.039
## studentLocBC 89.46949 40.15434 2.228
## studentLocCA 38.33453 33.18032 1.155
## studentLocCO 47.99947 34.39953 1.395
## studentLocCT 20.64168 33.03076 0.625
## studentLocDC 21.89776 33.01180 0.663
## studentLocDE 22.80921 33.03766 0.690
## studentLocFL 44.18063 33.06616 1.336
## studentLocFR 89.49559 33.54924 2.668
## studentLocGA 57.33753 33.23487 1.725
## studentLocIA 6.79058 35.44057 0.192
## studentLocIL 39.93331 33.28116 1.200
## studentLocIN 69.77234 34.04008 2.050
## studentLocKS -11.79677 40.15248 -0.294
## studentLocKY 41.47222 34.59348 1.199
## studentLocLA 58.08130 40.16076 1.446
## studentLocMA 19.69160 33.08177 0.595
## studentLocMD 32.45002 32.82926 0.988
## studentLocME 35.37004 37.86356 0.934
## studentLocMI 47.79005 33.66638 1.420
## studentLocMN 65.00878 35.94366 1.809
## studentLocMO 14.20808 35.93350 0.395
## studentLocMS 36.18139 40.14259 0.901
## studentLocMT 172.35225 46.35961 3.718
## studentLocNC 38.97249 33.17042 1.175
## studentLocND -6.26191 46.37529 -0.135
## studentLocNE -2.70922 46.69107 -0.058
## studentLocNH 25.54774 34.58451 0.739
## studentLocNJ 29.42506 32.84324 0.896
## studentLocNM 0.98568 46.35581 0.021
## studentLocNV 55.62309 36.70257 1.516
## studentLocNY 28.97907 32.86567 0.882
## studentLocOH 35.85442 32.86269 1.091
## studentLocOK 18.14714 35.93632 0.505
## studentLocON 148.76452 36.67374 4.056
## studentLocOR 67.26994 37.86859 1.776
## studentLocPA 39.56166 32.82573 1.205
## studentLocPR 89.18911 46.34846 1.924
## studentLocRI 19.46314 35.06197 0.555
## studentLocSC 38.19504 33.58086 1.137
## studentLocSD 17.22388 46.38549 0.371
## studentLocTN 51.85806 33.61877 1.543
## studentLocTX 59.37620 33.13484 1.792
## studentLocUT 65.12679 46.35594 1.405
## studentLocVA 27.29474 32.83223 0.831
## studentLocVT 32.36576 34.79549 0.930
## studentLocWA 14.69486 34.81155 0.422
## studentLocWI 36.98325 34.04898 1.086
## studentLocWV 24.09984 32.80411 0.735
## stateIndicatorIn-State NA NA NA
## proxStudentTypeLong Commute -0.21729 2.27596 -0.095
## proxStudentTypeShort Commute 5.43824 1.08601 5.008
## scaledAcademAchiev 0.90378 0.03401 26.575
## affinityStatusNo Affinity 3.03372 0.72444 4.188
## expectedFamContrib 0.06969 0.01611 4.325
## Pr(>|t|)
## (Intercept) 0.026778 *
## studentGenderM 0.917185
## studentEthnBlack 1.85e-08 ***
## studentEthnHispanic 0.944931
## studentEthnAsian 0.861060
## studentEthnNative 0.268695
## studentEthnUnknown 1.26e-08 ***
## degreeFAssociate of Arts 0.162666
## degreeFBachelor Electronic Engr 0.921565
## degreeFBachelor Engr Tech 0.015463 *
## degreeFBachelor of Arts 0.018243 *
## degreeFBachelor of Fine Arts 0.402769
## degreeFBachelor of Multidisc. Studies 0.274517
## degreeFBachelor of Music 3.22e-09 ***
## degreeFBachelor of Science 0.003428 **
## degreeFBachelor of Science in Nursing 0.137088
## degreeFBachelor of Social Work 0.751564
## degreeFBS in Aerospace Engineering 0.077474 .
## degreeFBS in Agriculture 0.652839
## degreeFBS in Biometric Systems 0.322745
## degreeFBS in Business Administration 0.039167 *
## degreeFBS in Chemical Engineering 0.029349 *
## degreeFBS in Civil Engineering 2.21e-05 ***
## degreeFBS in Computer Engineering 0.081093 .
## degreeFBS in Computer Science 5.07e-06 ***
## degreeFBS in Electrical Engineering 0.007138 **
## degreeFBS in Forestry 0.474348
## degreeFBS in Industrial Engineering 0.093817 .
## degreeFBS in Journalism 0.038024 *
## degreeFBS in Landscape Architecture 0.010467 *
## degreeFBS in Mechanical Engineering 4.05e-05 ***
## degreeFBS in Mining Engineering 0.727042
## degreeFBS in Petroleum & Natl Gas Eng 0.056591 .
## degreeFBS in Physical Education 1.36e-05 ***
## degreeFBS in Recreation 0.233201
## degreeFDegree Not Declared 0.100428
## degreeFRegents Bachelor of Arts 0.713138
## degreeTypeRegent Degree NA
## degreeTypeDegree Not Declared NA
## degreeTypeAssociate Arts NA
## degreeTypeAssociate Applied Sci NA
## studentLocAK 0.880483
## studentLocAL 0.595166
## studentLocAP 0.505748
## studentLocAR 0.738903
## studentLocAZ 0.968962
## studentLocBC 0.025897 *
## studentLocCA 0.247984
## studentLocCO 0.162946
## studentLocCT 0.532038
## studentLocDC 0.507136
## studentLocDE 0.489961
## studentLocFL 0.181543
## studentLocFR 0.007654 **
## studentLocGA 0.084524 .
## studentLocIA 0.848057
## studentLocIL 0.230220
## studentLocIN 0.040423 *
## studentLocKS 0.768918
## studentLocKY 0.230622
## studentLocLA 0.148152
## studentLocMA 0.551699
## studentLocMD 0.322961
## studentLocME 0.350256
## studentLocMI 0.155785
## studentLocMN 0.070544 .
## studentLocMO 0.692558
## studentLocMS 0.367443
## studentLocMT 0.000202 ***
## studentLocNC 0.240061
## studentLocND 0.892594
## studentLocNE 0.953731
## studentLocNH 0.460107
## studentLocNJ 0.370319
## studentLocNM 0.983036
## studentLocNV 0.129681
## studentLocNY 0.377941
## studentLocOH 0.275287
## studentLocOK 0.613586
## studentLocON 5.03e-05 ***
## studentLocOR 0.075702 .
## studentLocPA 0.228159
## studentLocPR 0.054348 .
## studentLocRI 0.578836
## studentLocSC 0.255401
## studentLocSD 0.710408
## studentLocTN 0.122981
## studentLocTX 0.073175 .
## studentLocUT 0.160079
## studentLocVA 0.405805
## studentLocVT 0.352309
## studentLocWA 0.672944
## studentLocWI 0.277431
## studentLocWV 0.462567
## stateIndicatorIn-State NA
## proxStudentTypeLong Commute 0.923942
## proxStudentTypeShort Commute 5.62e-07 ***
## scaledAcademAchiev < 2e-16 ***
## affinityStatusNo Affinity 2.85e-05 ***
## expectedFamContrib 1.54e-05 ***
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 32.72 on 8495 degrees of freedom
## Multiple R-squared: 0.168, Adjusted R-squared: 0.1588
## F-statistic: 18.25 on 94 and 8495 DF, p-value: < 2.2e-16
ncvTest(totalAwardWVUMod3)
## Non-constant Variance Score Test
## Variance formula: ~ fitted.values
## Chisquare = 493.3887 Df = 1 p = 2.608982e-109
plot(totalAwardWVUMod3)
## Warning: not plotting observations with leverage one:
## 480, 2813, 7441
## Warning: not plotting observations with leverage one:
## 480, 2813, 7441
## Warning in sqrt(crit * p * (1 - hh)/hh): NaNs produced
## Warning in sqrt(crit * p * (1 - hh)/hh): NaNs produced
mmp(totalAwardWVUMod3)
par(mfrow = c(1, 2))
plot(log(totalAwardWVU) ~ modWVUAid$fitted.values)
plot(log(totalAwardWVU) ~ totalAwardWVUMod3$fitted.values)
par(mfrow = c(1, 2))
mmp(modWVUAid, sd = TRUE)
mmp(totalAwardWVUMod3, sd = TRUE)
#test model predictions
names(finDataTableWVU)
## [1] "rule49Grant" "instEmployAid"
## [3] "instGrantAcademic" "instGrantAthletic"
## [5] "instGrantOther" "studentGender"
## [7] "studentEthn" "degreeF"
## [9] "degreeType" "studentLoc"
## [11] "stateIndicator" "proxStudentType"
## [13] "highSchoolGPA" "prevColGPA"
## [15] "highestACT" "totalSAT"
## [17] "scoreGED" "scaledAcademAchiev"
## [19] "affinityStatus" "expectedFamContrib"
## [21] "totalAwardWVU" "totalAwardnonWVU"
## [23] "totalAwardPromScholar" "aidStudentWVU"
## [25] "aidStudentnonWVU" "aidStudentPromScholar"
## [27] "highSchoolGPA.NA" "prevColGPA.NA"
## [29] "highestACT.NA" "totalSAT.NA"
## [31] "scoreGED.NA" "expectedFamContrib.NA"
## [33] "studentEthn.NA" "scaledAcademAchiev.NA"
which(finDataTableWVU[,21] > 40000)
## [1] 1355 3654 7276 7369 7442
fitResults <- predict(modWVUAid, newdata = finDataTableWVU[1355,], type = "response")
(fitResults)^2
## 1355
## 3551.281
finDataTableWVU[1355, 21]
## [1] 41170
#Unfortunately while the models fit that data well, testing it with the predictions about show that the results do not seem to accurately predict totalAwardWVU
Modeling students who received no WVU direct aid with those who did receive WVU aid created mixed results and lowered the quality of the prediction. By modelling them separately, we can provide better insight to the university.
By modeling just the population that did receive at least some totalAwardWVU we will get more accurate predicitors. With this, we can see what variables were important for increasing the amount of WVU aid that the university decided to issue to a student.
#run model on subset of students that received WVU aid #AL12 Total WVU Award > 0
finDataTableWVU_AL12 <- subset(finDataTableWVU, totalAwardWVU > 0)
dim(finDataTableWVU_AL12)
## [1] 4396 34
summary(finDataTableWVU_AL12)
## rule49Grant instEmployAid instGrantAcademic instGrantAthletic
## Min. : 0 Min. : 0.0 Min. : 0 Min. : 0.0
## 1st Qu.: 0 1st Qu.: 0.0 1st Qu.: 0 1st Qu.: 0.0
## Median : 0 Median : 0.0 Median : 0 Median : 0.0
## Mean : 1856 Mean : 369.9 Mean : 1029 Mean : 588.6
## 3rd Qu.: 3000 3rd Qu.: 0.0 3rd Qu.: 2000 3rd Qu.: 0.0
## Max. :21336 Max. :17233.0 Max. :15603 Max. :41170.0
##
## instGrantOther studentGender studentEthn
## Min. : 0 F:2068 White :1638
## 1st Qu.: 0 M:2328 Black : 169
## Median : 0 Hispanic: 31
## Mean : 367 Asian : 51
## 3rd Qu.: 0 Native : 8
## Max. :9338 Unknown :2499
##
## degreeF degreeType
## Bachelor of Science :1925 Bachelor Degree :4018
## Bachelor of Arts : 990 Regent Degree : 1
## BS in Business Administration : 396 Degree Not Declared : 50
## Associate of Arts : 302 Associate Arts : 302
## BS in Journalism : 126 Associate Applied Sci: 25
## Bachelor of Multidisc. Studies: 76
## (Other) : 581
## studentLoc stateIndicator proxStudentType
## WV :2324 Out-of-State:2072 Res or Out-of-State:3444
## PA : 540 In-State :2324 Long Commute : 124
## MD : 376 Short Commute : 828
## VA : 296
## NJ : 201
## OH : 188
## (Other): 471
## highSchoolGPA prevColGPA highestACT totalSAT
## Min. : 1.00 Min. : 1.00 Min. : 1.00 Min. : 1.00
## 1st Qu.: 68.39 1st Qu.: 1.00 1st Qu.: 37.33 1st Qu.: 39.08
## Median : 78.21 Median : 72.03 Median : 53.68 Median : 52.62
## Mean : 75.92 Mean : 52.50 Mean : 46.62 Mean : 46.11
## 3rd Qu.: 88.90 3rd Qu.: 90.59 3rd Qu.: 64.58 3rd Qu.: 61.08
## Max. :100.00 Max. :100.00 Max. :100.00 Max. :100.00
##
## scoreGED scaledAcademAchiev affinityStatus
## Min. : 1.000 Min. : 23.03 Some Affinity:1939
## 1st Qu.: 1.000 1st Qu.: 62.23 No Affinity :2457
## Median : 1.000 Median : 68.98
## Mean : 2.145 Mean : 68.35
## 3rd Qu.: 1.000 3rd Qu.: 75.07
## Max. :100.000 Max. :100.00
##
## expectedFamContrib totalAwardWVU totalAwardnonWVU totalAwardPromScholar
## Min. : 0.000 Min. : 25 Min. : 0 Min. : 0
## 1st Qu.: 2.024 1st Qu.: 1500 1st Qu.: 2375 1st Qu.: 0
## Median : 11.176 Median : 3000 Median : 6339 Median : 0
## Mean : 19.440 Mean : 4211 Mean : 8397 Mean :1558
## 3rd Qu.: 27.540 3rd Qu.: 5000 3rd Qu.:13054 3rd Qu.:4750
## Max. :100.000 Max. :43560 Max. :42328 Max. :7125
##
## aidStudentWVU aidStudentnonWVU
## Did not received WVU aid: 0 Did not received other aid: 942
## Received WVU aid :4396 Received other aid :3454
##
##
##
##
##
## aidStudentPromScholar highSchoolGPA.NA prevColGPA.NA highestACT.NA
## Is not Promise:2899 Mode :logical Mode :logical Mode :logical
## Is Promise :1497 FALSE:4315 FALSE:2733 FALSE:3502
## TRUE :81 TRUE :1663 TRUE :894
## NA's :0 NA's :0 NA's :0
##
##
##
## totalSAT.NA scoreGED.NA expectedFamContrib.NA studentEthn.NA
## Mode :logical Mode :logical Mode :logical Mode :logical
## FALSE:3610 FALSE:65 FALSE:4260 FALSE:4377
## TRUE :786 TRUE :4331 TRUE :136 TRUE :19
## NA's :0 NA's :0 NA's :0 NA's :0
##
##
##
## scaledAcademAchiev.NA
## Mode :logical
## FALSE:4396
## NA's :0
##
##
##
##
sum(finDataTableWVU_AL12$totalAwardWVU)
## [1] 18510879
modWVUAid_1 <- lm(totalAwardWVU ~ studentGender + studentEthn + degreeF + studentLoc + proxStudentType + affinityStatus + expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU + aidStudentPromScholar + highestACT + highestACT.NA + totalSAT + totalSAT.NA + totalAwardnonWVU + totalAwardPromScholar + highSchoolGPA + highSchoolGPA.NA + prevColGPA + prevColGPA.NA + scoreGED + scoreGED.NA + scaledAcademAchiev, data = finDataTableWVU_AL12)
summary(modWVUAid_1)
##
## Call:
## lm(formula = totalAwardWVU ~ studentGender + studentEthn + degreeF +
## studentLoc + proxStudentType + affinityStatus + expectedFamContrib +
## expectedFamContrib.NA + aidStudentnonWVU + aidStudentPromScholar +
## highestACT + highestACT.NA + totalSAT + totalSAT.NA + totalAwardnonWVU +
## totalAwardPromScholar + highSchoolGPA + highSchoolGPA.NA +
## prevColGPA + prevColGPA.NA + scoreGED + scoreGED.NA + scaledAcademAchiev,
## data = finDataTableWVU_AL12)
##
## Residuals:
## Min 1Q Median 3Q Max
## -13043 -2157 -716 906 37444
##
## Coefficients:
## Estimate Std. Error t value
## (Intercept) 8.457e+02 5.328e+03 0.159
## studentGenderM 5.309e+01 1.429e+02 0.371
## studentEthnBlack 3.457e+03 3.760e+02 9.195
## studentEthnHispanic 1.061e+03 8.085e+02 1.312
## studentEthnAsian 8.626e+01 6.403e+02 0.135
## studentEthnNative 3.054e+03 1.579e+03 1.934
## studentEthnUnknown 6.965e+01 1.487e+02 0.468
## degreeFAssociate of Arts 2.553e+02 9.298e+02 0.275
## degreeFBachelor Engr Tech 5.240e+03 2.719e+03 1.927
## degreeFBachelor of Arts 2.181e+03 9.150e+02 2.383
## degreeFBachelor of Fine Arts 1.383e+03 1.083e+03 1.277
## degreeFBachelor of Multidisc. Studies 1.336e+03 1.037e+03 1.289
## degreeFBachelor of Music 3.241e+03 1.067e+03 3.037
## degreeFBachelor of Science 1.881e+03 9.096e+02 2.068
## degreeFBachelor of Science in Nursing 1.345e+03 1.906e+03 0.706
## degreeFBachelor of Social Work 1.488e+03 1.418e+03 1.050
## degreeFBS in Aerospace Engineering 3.713e+03 1.225e+03 3.031
## degreeFBS in Agriculture 1.063e+03 1.233e+03 0.862
## degreeFBS in Biometric Systems 2.582e+03 2.182e+03 1.183
## degreeFBS in Business Administration 1.687e+03 9.342e+02 1.806
## degreeFBS in Chemical Engineering 3.576e+03 1.236e+03 2.893
## degreeFBS in Civil Engineering 2.525e+03 1.167e+03 2.164
## degreeFBS in Computer Engineering 1.386e+03 1.363e+03 1.016
## degreeFBS in Computer Science 2.955e+03 1.122e+03 2.635
## degreeFBS in Electrical Engineering 2.525e+03 1.243e+03 2.031
## degreeFBS in Forestry 1.041e+03 1.503e+03 0.693
## degreeFBS in Industrial Engineering 4.614e+03 1.404e+03 3.286
## degreeFBS in Journalism 1.982e+03 9.888e+02 2.004
## degreeFBS in Landscape Architecture 1.217e+03 1.414e+03 0.861
## degreeFBS in Mechanical Engineering 3.953e+03 1.146e+03 3.451
## degreeFBS in Mining Engineering -1.187e+03 1.908e+03 -0.622
## degreeFBS in Petroleum & Natl Gas Eng 1.987e+03 1.242e+03 1.600
## degreeFBS in Physical Education 2.200e+03 1.546e+03 1.423
## degreeFBS in Recreation -9.176e+02 2.396e+03 -0.383
## degreeFDegree Not Declared 2.090e+02 1.096e+03 0.191
## degreeFRegents Bachelor of Arts 6.978e+02 4.532e+03 0.154
## studentLocAR -3.129e+03 5.206e+03 -0.601
## studentLocBC 2.692e+04 5.165e+03 5.213
## studentLocCA 3.010e+03 2.783e+03 1.082
## studentLocCO 6.270e+03 3.283e+03 1.910
## studentLocCT -1.355e+03 2.764e+03 -0.490
## studentLocDC -5.956e+02 2.883e+03 -0.207
## studentLocDE 1.715e+03 2.818e+03 0.609
## studentLocFL 1.648e+03 2.711e+03 0.608
## studentLocFR 3.519e+03 2.803e+03 1.256
## studentLocGA 6.620e+03 2.770e+03 2.390
## studentLocIL 3.037e+03 2.818e+03 1.078
## studentLocIN 1.092e+04 3.050e+03 3.579
## studentLocKY -1.718e+02 3.115e+03 -0.055
## studentLocLA 7.526e+03 5.147e+03 1.462
## studentLocMA 1.466e+02 2.807e+03 0.052
## studentLocMD 3.968e+01 2.624e+03 0.015
## studentLocME -9.087e+02 4.081e+03 -0.223
## studentLocMI 7.377e+03 2.969e+03 2.485
## studentLocMN 9.862e+03 3.669e+03 2.688
## studentLocMO 1.519e+03 5.147e+03 0.295
## studentLocMS 1.829e+03 5.145e+03 0.355
## studentLocMT 2.929e+04 5.159e+03 5.677
## studentLocNC 2.934e+03 2.789e+03 1.052
## studentLocNH -1.856e+03 3.295e+03 -0.563
## studentLocNJ 3.416e+02 2.634e+03 0.130
## studentLocNV 2.165e+03 3.661e+03 0.591
## studentLocNY 4.657e+02 2.646e+03 0.176
## studentLocOH 3.851e+02 2.633e+03 0.146
## studentLocOK 1.356e+04 5.147e+03 2.635
## studentLocON 1.754e+04 3.436e+03 5.104
## studentLocOR 1.040e+04 4.079e+03 2.550
## studentLocPA 1.139e+03 2.621e+03 0.435
## studentLocPR 6.632e+03 5.151e+03 1.287
## studentLocRI -3.113e+02 4.078e+03 -0.076
## studentLocSC 2.533e+03 2.939e+03 0.862
## studentLocSD -1.730e+03 5.157e+03 -0.335
## studentLocTN 1.480e+03 2.855e+03 0.518
## studentLocTX 6.634e+03 2.735e+03 2.425
## studentLocUT -3.846e+02 5.150e+03 -0.075
## studentLocVA -2.046e+02 2.625e+03 -0.078
## studentLocVT -1.824e+03 3.446e+03 -0.529
## studentLocWA 1.042e+03 4.101e+03 0.254
## studentLocWI 2.169e+03 3.109e+03 0.697
## studentLocWV -4.469e+01 2.622e+03 -0.017
## proxStudentTypeLong Commute -9.106e+01 4.178e+02 -0.218
## proxStudentTypeShort Commute 1.446e+03 2.082e+02 6.947
## affinityStatusNo Affinity 3.421e+02 1.399e+02 2.446
## expectedFamContrib -1.183e+01 3.073e+00 -3.848
## expectedFamContrib.NATRUE 9.537e+02 4.199e+02 2.271
## aidStudentnonWVUReceived other aid -1.373e+02 2.327e+02 -0.590
## aidStudentPromScholarIs Promise -2.816e+03 9.439e+02 -2.983
## highestACT 5.279e+01 1.019e+01 5.179
## highestACT.NATRUE 3.419e+03 6.819e+02 5.014
## totalSAT 7.686e+01 1.090e+01 7.054
## totalSAT.NATRUE 4.122e+03 7.381e+02 5.585
## totalAwardnonWVU -5.041e-02 1.174e-02 -4.294
## totalAwardPromScholar 1.826e-01 2.019e-01 0.904
## highSchoolGPA 2.402e+01 1.095e+01 2.194
## highSchoolGPA.NATRUE 2.362e+03 9.431e+02 2.505
## prevColGPA 2.515e+00 9.760e+00 0.258
## prevColGPA.NATRUE 1.100e+02 7.079e+02 0.155
## scoreGED -6.345e+01 5.564e+01 -1.140
## scoreGED.NATRUE -4.897e+03 4.338e+03 -1.129
## scaledAcademAchiev -3.922e+01 2.839e+01 -1.382
## Pr(>|t|)
## (Intercept) 0.873880
## studentGenderM 0.710380
## studentEthnBlack < 2e-16 ***
## studentEthnHispanic 0.189527
## studentEthnAsian 0.892840
## studentEthnNative 0.053234 .
## studentEthnUnknown 0.639565
## degreeFAssociate of Arts 0.783629
## degreeFBachelor Engr Tech 0.054057 .
## degreeFBachelor of Arts 0.017212 *
## degreeFBachelor of Fine Arts 0.201557
## degreeFBachelor of Multidisc. Studies 0.197457
## degreeFBachelor of Music 0.002403 **
## degreeFBachelor of Science 0.038723 *
## degreeFBachelor of Science in Nursing 0.480370
## degreeFBachelor of Social Work 0.293987
## degreeFBS in Aerospace Engineering 0.002452 **
## degreeFBS in Agriculture 0.388724
## degreeFBS in Biometric Systems 0.236815
## degreeFBS in Business Administration 0.070972 .
## degreeFBS in Chemical Engineering 0.003841 **
## degreeFBS in Civil Engineering 0.030539 *
## degreeFBS in Computer Engineering 0.309454
## degreeFBS in Computer Science 0.008456 **
## degreeFBS in Electrical Engineering 0.042286 *
## degreeFBS in Forestry 0.488360
## degreeFBS in Industrial Engineering 0.001023 **
## degreeFBS in Journalism 0.045101 *
## degreeFBS in Landscape Architecture 0.389538
## degreeFBS in Mechanical Engineering 0.000564 ***
## degreeFBS in Mining Engineering 0.533723
## degreeFBS in Petroleum & Natl Gas Eng 0.109590
## degreeFBS in Physical Education 0.154758
## degreeFBS in Recreation 0.701810
## degreeFDegree Not Declared 0.848708
## degreeFRegents Bachelor of Arts 0.877628
## studentLocAR 0.547865
## studentLocBC 1.95e-07 ***
## studentLocCA 0.279413
## studentLocCO 0.056208 .
## studentLocCT 0.623903
## studentLocDC 0.836321
## studentLocDE 0.542734
## studentLocFL 0.543322
## studentLocFR 0.209349
## studentLocGA 0.016884 *
## studentLocIL 0.281247
## studentLocIN 0.000349 ***
## studentLocKY 0.956025
## studentLocLA 0.143738
## studentLocMA 0.958351
## studentLocMD 0.987936
## studentLocME 0.823830
## studentLocMI 0.012994 *
## studentLocMN 0.007208 **
## studentLocMO 0.767905
## studentLocMS 0.722316
## studentLocMT 1.46e-08 ***
## studentLocNC 0.292949
## studentLocNH 0.573302
## studentLocNJ 0.896796
## studentLocNV 0.554319
## studentLocNY 0.860296
## studentLocOH 0.883718
## studentLocOK 0.008433 **
## studentLocON 3.47e-07 ***
## studentLocOR 0.010806 *
## studentLocPA 0.663941
## studentLocPR 0.198036
## studentLocRI 0.939161
## studentLocSC 0.388881
## studentLocSD 0.737322
## studentLocTN 0.604181
## studentLocTX 0.015334 *
## studentLocUT 0.940479
## studentLocVA 0.937881
## studentLocVT 0.596614
## studentLocWA 0.799372
## studentLocWI 0.485545
## studentLocWV 0.986399
## proxStudentTypeLong Commute 0.827477
## proxStudentTypeShort Commute 4.29e-12 ***
## affinityStatusNo Affinity 0.014497 *
## expectedFamContrib 0.000121 ***
## expectedFamContrib.NATRUE 0.023187 *
## aidStudentnonWVUReceived other aid 0.555352
## aidStudentPromScholarIs Promise 0.002867 **
## highestACT 2.33e-07 ***
## highestACT.NATRUE 5.55e-07 ***
## totalSAT 2.02e-12 ***
## totalSAT.NATRUE 2.48e-08 ***
## totalAwardnonWVU 1.80e-05 ***
## totalAwardPromScholar 0.365910
## highSchoolGPA 0.028289 *
## highSchoolGPA.NATRUE 0.012282 *
## prevColGPA 0.796662
## prevColGPA.NATRUE 0.876545
## scoreGED 0.254208
## scoreGED.NATRUE 0.258976
## scaledAcademAchiev 0.167185
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 4423 on 4296 degrees of freedom
## Multiple R-squared: 0.2351, Adjusted R-squared: 0.2174
## F-statistic: 13.33 on 99 and 4296 DF, p-value: < 2.2e-16
anova(modWVUAid_1) #promScholar aid, prevColGPA, scoreGED, and scaledAcademAchiev amount is not sig
## Analysis of Variance Table
##
## Response: totalAwardWVU
## Df Sum Sq Mean Sq F value Pr(>F)
## studentGender 1 1.5281e+08 152813204 7.8113 0.005215 **
## studentEthn 5 1.8847e+09 376934139 19.2676 < 2.2e-16 ***
## degreeF 29 3.4059e+09 117446285 6.0035 < 2.2e-16 ***
## studentLoc 44 1.1679e+10 265438147 13.5683 < 2.2e-16 ***
## proxStudentType 2 2.2013e+09 1100647812 56.2614 < 2.2e-16 ***
## affinityStatus 1 1.3637e+08 136367153 6.9706 0.008316 **
## expectedFamContrib 1 1.5669e+08 156692734 8.0096 0.004675 **
## expectedFamContrib.NA 1 4.2053e+08 420530903 21.4961 3.651e-06 ***
## aidStudentnonWVU 1 6.7344e+08 673441362 34.4241 4.766e-09 ***
## aidStudentPromScholar 1 7.2936e+08 729362741 37.2826 1.112e-09 ***
## highestACT 1 7.6638e+07 76638455 3.9175 0.047850 *
## highestACT.NA 1 1.4968e+09 1496841056 76.5135 < 2.2e-16 ***
## totalSAT 1 7.0771e+08 707708990 36.1757 1.953e-09 ***
## totalSAT.NA 1 1.4898e+09 1489793942 76.1533 < 2.2e-16 ***
## totalAwardnonWVU 1 3.7087e+08 370869041 18.9576 1.368e-05 ***
## totalAwardPromScholar 1 1.5235e+07 15234940 0.7788 0.377570
## highSchoolGPA 1 1.4633e+07 14633374 0.7480 0.387156
## highSchoolGPA.NA 1 8.9334e+07 89334167 4.5665 0.032660 *
## prevColGPA 1 2.3815e+07 23815079 1.2173 0.269944
## prevColGPA.NA 1 2.6160e+07 26160439 1.3372 0.247587
## scoreGED 1 2.2754e+06 2275429 0.1163 0.733086
## scoreGED.NA 1 3.3375e+07 33375106 1.7060 0.191572
## scaledAcademAchiev 1 3.7339e+07 37339193 1.9087 0.167185
## Residuals 4296 8.4043e+10 19563091
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
modWVUAid_2 <- lm(totalAwardWVU ~ studentGender + studentEthn + degreeF + studentLoc + proxStudentType + affinityStatus + expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU + aidStudentPromScholar + highSchoolGPA + highSchoolGPA.NA + highestACT + highestACT.NA + totalSAT + totalSAT.NA + totalAwardnonWVU, data = finDataTableWVU_AL12)
summary(modWVUAid_2)
##
## Call:
## lm(formula = totalAwardWVU ~ studentGender + studentEthn + degreeF +
## studentLoc + proxStudentType + affinityStatus + expectedFamContrib +
## expectedFamContrib.NA + aidStudentnonWVU + aidStudentPromScholar +
## highSchoolGPA + highSchoolGPA.NA + highestACT + highestACT.NA +
## totalSAT + totalSAT.NA + totalAwardnonWVU, data = finDataTableWVU_AL12)
##
## Residuals:
## Min 1Q Median 3Q Max
## -13066 -2169 -705 890 37463
##
## Coefficients:
## Estimate Std. Error t value
## (Intercept) -4.268e+03 2.834e+03 -1.506
## studentGenderM 6.219e+01 1.428e+02 0.435
## studentEthnBlack 3.470e+03 3.756e+02 9.240
## studentEthnHispanic 1.028e+03 8.080e+02 1.272
## studentEthnAsian 1.391e+02 6.391e+02 0.218
## studentEthnNative 3.005e+03 1.579e+03 1.904
## studentEthnUnknown 7.480e+01 1.486e+02 0.503
## degreeFAssociate of Arts 2.418e+02 9.268e+02 0.261
## degreeFBachelor Engr Tech 5.151e+03 2.719e+03 1.895
## degreeFBachelor of Arts 2.215e+03 9.140e+02 2.424
## degreeFBachelor of Fine Arts 1.441e+03 1.082e+03 1.332
## degreeFBachelor of Multidisc. Studies 1.349e+03 1.036e+03 1.302
## degreeFBachelor of Music 3.224e+03 1.067e+03 3.022
## degreeFBachelor of Science 1.901e+03 9.088e+02 2.092
## degreeFBachelor of Science in Nursing 1.342e+03 1.903e+03 0.705
## degreeFBachelor of Social Work 1.496e+03 1.416e+03 1.056
## degreeFBS in Aerospace Engineering 3.730e+03 1.223e+03 3.049
## degreeFBS in Agriculture 1.076e+03 1.232e+03 0.873
## degreeFBS in Biometric Systems 2.710e+03 2.181e+03 1.242
## degreeFBS in Business Administration 1.709e+03 9.334e+02 1.831
## degreeFBS in Chemical Engineering 3.493e+03 1.235e+03 2.828
## degreeFBS in Civil Engineering 2.630e+03 1.165e+03 2.257
## degreeFBS in Computer Engineering 1.417e+03 1.361e+03 1.041
## degreeFBS in Computer Science 2.989e+03 1.120e+03 2.668
## degreeFBS in Electrical Engineering 2.587e+03 1.242e+03 2.083
## degreeFBS in Forestry 1.064e+03 1.502e+03 0.709
## degreeFBS in Industrial Engineering 4.644e+03 1.403e+03 3.310
## degreeFBS in Journalism 2.008e+03 9.880e+02 2.032
## degreeFBS in Landscape Architecture 1.307e+03 1.413e+03 0.925
## degreeFBS in Mechanical Engineering 3.949e+03 1.145e+03 3.450
## degreeFBS in Mining Engineering -1.099e+03 1.907e+03 -0.576
## degreeFBS in Petroleum & Natl Gas Eng 1.960e+03 1.240e+03 1.580
## degreeFBS in Physical Education 2.243e+03 1.546e+03 1.451
## degreeFBS in Recreation -9.628e+02 2.396e+03 -0.402
## degreeFDegree Not Declared 3.068e+02 1.094e+03 0.280
## degreeFRegents Bachelor of Arts 4.693e+02 4.527e+03 0.104
## studentLocAR -3.088e+03 5.206e+03 -0.593
## studentLocBC 2.726e+04 5.161e+03 5.282
## studentLocCA 3.076e+03 2.782e+03 1.106
## studentLocCO 6.352e+03 3.282e+03 1.936
## studentLocCT -1.234e+03 2.762e+03 -0.447
## studentLocDC -5.164e+02 2.883e+03 -0.179
## studentLocDE 1.789e+03 2.816e+03 0.635
## studentLocFL 1.723e+03 2.710e+03 0.636
## studentLocFR 3.600e+03 2.802e+03 1.285
## studentLocGA 6.728e+03 2.768e+03 2.431
## studentLocIL 3.142e+03 2.817e+03 1.115
## studentLocIN 1.097e+04 3.050e+03 3.597
## studentLocKY 2.400e+00 3.114e+03 0.001
## studentLocLA 7.690e+03 5.145e+03 1.495
## studentLocMA 1.840e+02 2.806e+03 0.066
## studentLocMD 1.111e+02 2.623e+03 0.042
## studentLocME -7.309e+02 4.080e+03 -0.179
## studentLocMI 7.481e+03 2.967e+03 2.521
## studentLocMN 9.892e+03 3.667e+03 2.698
## studentLocMO 1.709e+03 5.146e+03 0.332
## studentLocMS 1.875e+03 5.146e+03 0.364
## studentLocMT 2.921e+04 5.160e+03 5.662
## studentLocNC 3.024e+03 2.788e+03 1.085
## studentLocNH -1.978e+03 3.288e+03 -0.602
## studentLocNJ 4.170e+02 2.633e+03 0.158
## studentLocNV 2.138e+03 3.662e+03 0.584
## studentLocNY 5.366e+02 2.645e+03 0.203
## studentLocOH 4.617e+02 2.632e+03 0.175
## studentLocOK 1.366e+04 5.147e+03 2.654
## studentLocON 1.766e+04 3.434e+03 5.142
## studentLocOR 1.042e+04 4.080e+03 2.553
## studentLocPA 1.198e+03 2.620e+03 0.457
## studentLocPR 6.634e+03 5.152e+03 1.288
## studentLocRI -2.387e+02 4.078e+03 -0.059
## studentLocSC 2.603e+03 2.938e+03 0.886
## studentLocSD -1.604e+03 5.158e+03 -0.311
## studentLocTN 1.464e+03 2.854e+03 0.513
## studentLocTX 6.700e+03 2.735e+03 2.450
## studentLocUT -2.490e+02 5.149e+03 -0.048
## studentLocVA -1.078e+02 2.624e+03 -0.041
## studentLocVT -1.725e+03 3.444e+03 -0.501
## studentLocWA 1.165e+03 4.098e+03 0.284
## studentLocWI 2.340e+03 3.107e+03 0.753
## studentLocWV 1.632e+01 2.621e+03 0.006
## proxStudentTypeLong Commute -6.839e+01 4.176e+02 -0.164
## proxStudentTypeShort Commute 1.454e+03 2.077e+02 7.003
## affinityStatusNo Affinity 3.780e+02 1.385e+02 2.730
## expectedFamContrib -1.166e+01 3.067e+00 -3.802
## expectedFamContrib.NATRUE 9.405e+02 4.193e+02 2.243
## aidStudentnonWVUReceived other aid -1.342e+02 2.327e+02 -0.577
## aidStudentPromScholarIs Promise -1.979e+03 2.220e+02 -8.916
## highSchoolGPA 1.037e+01 5.230e+00 1.982
## highSchoolGPA.NATRUE 1.383e+03 6.565e+02 2.107
## highestACT 4.080e+01 6.045e+00 6.749
## highestACT.NATRUE 2.604e+03 3.804e+02 6.844
## totalSAT 6.486e+01 6.527e+00 9.937
## totalSAT.NATRUE 3.268e+03 4.011e+02 8.149
## totalAwardnonWVU -4.975e-02 1.171e-02 -4.250
## Pr(>|t|)
## (Intercept) 0.132185
## studentGenderM 0.663235
## studentEthnBlack < 2e-16 ***
## studentEthnHispanic 0.203528
## studentEthnAsian 0.827756
## studentEthnNative 0.057005 .
## studentEthnUnknown 0.614654
## degreeFAssociate of Arts 0.794198
## degreeFBachelor Engr Tech 0.058203 .
## degreeFBachelor of Arts 0.015408 *
## degreeFBachelor of Fine Arts 0.182852
## degreeFBachelor of Multidisc. Studies 0.192827
## degreeFBachelor of Music 0.002524 **
## degreeFBachelor of Science 0.036484 *
## degreeFBachelor of Science in Nursing 0.480829
## degreeFBachelor of Social Work 0.290813
## degreeFBS in Aerospace Engineering 0.002310 **
## degreeFBS in Agriculture 0.382637
## degreeFBS in Biometric Systems 0.214133
## degreeFBS in Business Administration 0.067219 .
## degreeFBS in Chemical Engineering 0.004702 **
## degreeFBS in Civil Engineering 0.024063 *
## degreeFBS in Computer Engineering 0.298151
## degreeFBS in Computer Science 0.007652 **
## degreeFBS in Electrical Engineering 0.037301 *
## degreeFBS in Forestry 0.478482
## degreeFBS in Industrial Engineering 0.000942 ***
## degreeFBS in Journalism 0.042218 *
## degreeFBS in Landscape Architecture 0.354868
## degreeFBS in Mechanical Engineering 0.000567 ***
## degreeFBS in Mining Engineering 0.564393
## degreeFBS in Petroleum & Natl Gas Eng 0.114072
## degreeFBS in Physical Education 0.146757
## degreeFBS in Recreation 0.687764
## degreeFDegree Not Declared 0.779271
## degreeFRegents Bachelor of Arts 0.917437
## studentLocAR 0.553202
## studentLocBC 1.34e-07 ***
## studentLocCA 0.268947
## studentLocCO 0.052959 .
## studentLocCT 0.655089
## studentLocDC 0.857829
## studentLocDE 0.525397
## studentLocFL 0.524872
## studentLocFR 0.198860
## studentLocGA 0.015115 *
## studentLocIL 0.264789
## studentLocIN 0.000326 ***
## studentLocKY 0.999385
## studentLocLA 0.135076
## studentLocMA 0.947734
## studentLocMD 0.966210
## studentLocME 0.857847
## studentLocMI 0.011740 *
## studentLocMN 0.007009 **
## studentLocMO 0.739846
## studentLocMS 0.715524
## studentLocMT 1.60e-08 ***
## studentLocNC 0.278161
## studentLocNH 0.547529
## studentLocNJ 0.874150
## studentLocNV 0.559385
## studentLocNY 0.839249
## studentLocOH 0.860729
## studentLocOK 0.007981 **
## studentLocON 2.84e-07 ***
## studentLocOR 0.010701 *
## studentLocPA 0.647549
## studentLocPR 0.197937
## studentLocRI 0.953317
## studentLocSC 0.375710
## studentLocSD 0.755826
## studentLocTN 0.608118
## studentLocTX 0.014320 *
## studentLocUT 0.961434
## studentLocVA 0.967222
## studentLocVT 0.616567
## studentLocWA 0.776169
## studentLocWI 0.451488
## studentLocWV 0.995032
## proxStudentTypeLong Commute 0.869913
## proxStudentTypeShort Commute 2.90e-12 ***
## affinityStatusNo Affinity 0.006363 **
## expectedFamContrib 0.000145 ***
## expectedFamContrib.NATRUE 0.024960 *
## aidStudentnonWVUReceived other aid 0.563993
## aidStudentPromScholarIs Promise < 2e-16 ***
## highSchoolGPA 0.047517 *
## highSchoolGPA.NATRUE 0.035163 *
## highestACT 1.68e-11 ***
## highestACT.NATRUE 8.77e-12 ***
## totalSAT < 2e-16 ***
## totalSAT.NATRUE 4.77e-16 ***
## totalAwardnonWVU 2.18e-05 ***
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 4424 on 4302 degrees of freedom
## Multiple R-squared: 0.2338, Adjusted R-squared: 0.2172
## F-statistic: 14.11 on 93 and 4302 DF, p-value: < 2.2e-16
anova(modWVUAid_2)
## Analysis of Variance Table
##
## Response: totalAwardWVU
## Df Sum Sq Mean Sq F value Pr(>F)
## studentGender 1 1.5281e+08 152813204 7.8092 0.005221 **
## studentEthn 5 1.8847e+09 376934139 19.2623 < 2.2e-16 ***
## degreeF 29 3.4059e+09 117446285 6.0018 < 2.2e-16 ***
## studentLoc 44 1.1679e+10 265438147 13.5646 < 2.2e-16 ***
## proxStudentType 2 2.2013e+09 1100647812 56.2460 < 2.2e-16 ***
## affinityStatus 1 1.3637e+08 136367153 6.9687 0.008325 **
## expectedFamContrib 1 1.5669e+08 156692734 8.0074 0.004680 **
## expectedFamContrib.NA 1 4.2053e+08 420530903 21.4902 3.662e-06 ***
## aidStudentnonWVU 1 6.7344e+08 673441362 34.4146 4.788e-09 ***
## aidStudentPromScholar 1 7.2936e+08 729362741 37.2723 1.118e-09 ***
## highSchoolGPA 1 8.5486e+07 85486305 4.3686 0.036666 *
## highSchoolGPA.NA 1 1.8821e+08 188212314 9.6181 0.001939 **
## highestACT 1 6.7332e+07 67332023 3.4408 0.063672 .
## highestACT.NA 1 1.4615e+09 1461545051 74.6888 < 2.2e-16 ***
## totalSAT 1 6.9566e+08 695656452 35.5499 2.685e-09 ***
## totalSAT.NA 1 1.3917e+09 1391718584 71.1204 < 2.2e-16 ***
## totalAwardnonWVU 1 3.5353e+08 353534991 18.0666 2.178e-05 ***
## Residuals 4302 8.4184e+10 19568473
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
#model transformation require(MASS) bc <- boxcox(modWVUAid_2)
#The optimal transformation has a parameter close to 0 - use log
#find the approximate mle as the x-value that yields the maximum bc$x[bc$y==max(bc$y)]
modWVUAid_3 <- lm(log(totalAwardWVU) ~ studentGender + studentEthn + degreeF + studentLoc + proxStudentType + affinityStatus + expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU + aidStudentPromScholar + highestACT + highestACT.NA + totalSAT + totalSAT.NA + totalAwardnonWVU, data = finDataTableWVU_AL12)
summary(modWVUAid_3)
##
## Call:
## lm(formula = log(totalAwardWVU) ~ studentGender + studentEthn +
## degreeF + studentLoc + proxStudentType + affinityStatus +
## expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU +
## aidStudentPromScholar + highestACT + highestACT.NA + totalSAT +
## totalSAT.NA + totalAwardnonWVU, data = finDataTableWVU_AL12)
##
## Residuals:
## Min 1Q Median 3Q Max
## -4.8253 -0.4349 0.0438 0.4598 2.9691
##
## Coefficients:
## Estimate Std. Error t value
## (Intercept) 5.848e+00 5.285e-01 11.064
## studentGenderM 3.377e-02 2.671e-02 1.264
## studentEthnBlack 5.234e-01 7.040e-02 7.434
## studentEthnHispanic 3.127e-01 1.520e-01 2.057
## studentEthnAsian 4.465e-02 1.201e-01 0.372
## studentEthnNative 5.226e-01 2.970e-01 1.760
## studentEthnUnknown 2.545e-02 2.793e-02 0.911
## degreeFAssociate of Arts 2.050e-01 1.743e-01 1.176
## degreeFBachelor Engr Tech 1.553e+00 5.107e-01 3.042
## degreeFBachelor of Arts 6.537e-01 1.720e-01 3.802
## degreeFBachelor of Fine Arts 4.693e-01 2.035e-01 2.306
## degreeFBachelor of Multidisc. Studies 4.366e-01 1.948e-01 2.241
## degreeFBachelor of Music 1.000e+00 2.007e-01 4.985
## degreeFBachelor of Science 6.412e-01 1.710e-01 3.751
## degreeFBachelor of Science in Nursing 7.286e-01 3.573e-01 2.039
## degreeFBachelor of Social Work 3.920e-01 2.663e-01 1.472
## degreeFBS in Aerospace Engineering 9.210e-01 2.300e-01 4.004
## degreeFBS in Agriculture 4.291e-01 2.318e-01 1.851
## degreeFBS in Biometric Systems 1.014e+00 4.100e-01 2.472
## degreeFBS in Business Administration 5.981e-01 1.756e-01 3.406
## degreeFBS in Chemical Engineering 9.829e-01 2.322e-01 4.233
## degreeFBS in Civil Engineering 7.868e-01 2.192e-01 3.590
## degreeFBS in Computer Engineering 5.770e-01 2.561e-01 2.253
## degreeFBS in Computer Science 8.690e-01 2.107e-01 4.124
## degreeFBS in Electrical Engineering 8.836e-01 2.333e-01 3.787
## degreeFBS in Forestry 3.366e-01 2.825e-01 1.191
## degreeFBS in Industrial Engineering 1.038e+00 2.639e-01 3.933
## degreeFBS in Journalism 6.834e-01 1.859e-01 3.677
## degreeFBS in Landscape Architecture 6.679e-01 2.658e-01 2.512
## degreeFBS in Mechanical Engineering 9.529e-01 2.154e-01 4.425
## degreeFBS in Mining Engineering 1.889e-01 3.589e-01 0.526
## degreeFBS in Petroleum & Natl Gas Eng 7.418e-01 2.331e-01 3.183
## degreeFBS in Physical Education 1.120e+00 2.907e-01 3.852
## degreeFBS in Recreation -2.438e-01 4.507e-01 -0.541
## degreeFDegree Not Declared 3.425e-01 2.056e-01 1.665
## degreeFRegents Bachelor of Arts -4.241e-01 8.498e-01 -0.499
## studentLocAR -6.472e-01 9.796e-01 -0.661
## studentLocBC 2.087e+00 9.709e-01 2.149
## studentLocCA 4.130e-01 5.233e-01 0.789
## studentLocCO 9.177e-01 6.173e-01 1.487
## studentLocCT -5.150e-01 5.195e-01 -0.991
## studentLocDC -2.124e-01 5.422e-01 -0.392
## studentLocDE 1.802e-02 5.298e-01 0.034
## studentLocFL -1.443e-02 5.098e-01 -0.028
## studentLocFR 6.478e-01 5.268e-01 1.230
## studentLocGA 2.825e-01 5.207e-01 0.542
## studentLocIL 3.778e-01 5.301e-01 0.713
## studentLocIN 1.183e+00 5.738e-01 2.062
## studentLocKY -2.906e-01 5.859e-01 -0.496
## studentLocLA 1.489e+00 9.680e-01 1.538
## studentLocMA -2.676e-01 5.280e-01 -0.507
## studentLocMD -2.494e-01 4.935e-01 -0.505
## studentLocME -1.325e-01 7.677e-01 -0.173
## studentLocMI 8.461e-01 5.583e-01 1.515
## studentLocMN 1.075e+00 6.899e-01 1.557
## studentLocMO 4.968e-01 9.677e-01 0.513
## studentLocMS 4.316e-01 9.681e-01 0.446
## studentLocMT 1.873e+00 9.707e-01 1.929
## studentLocNC 3.136e-01 5.245e-01 0.598
## studentLocNH -6.674e-01 6.183e-01 -1.079
## studentLocNJ -1.194e-01 4.953e-01 -0.241
## studentLocNV 5.841e-01 6.890e-01 0.848
## studentLocNY -9.938e-02 4.975e-01 -0.200
## studentLocOH -2.020e-01 4.951e-01 -0.408
## studentLocOK 1.590e+00 9.683e-01 1.642
## studentLocON 1.599e+00 6.461e-01 2.475
## studentLocOR 3.386e-01 7.676e-01 0.441
## studentLocPA 7.746e-02 4.930e-01 0.157
## studentLocPR 1.310e+00 9.692e-01 1.352
## studentLocRI -3.191e-02 7.672e-01 -0.042
## studentLocSC 3.846e-01 5.525e-01 0.696
## studentLocSD -1.349e+00 9.704e-01 -1.390
## studentLocTN 1.903e-01 5.370e-01 0.354
## studentLocTX 8.358e-01 5.145e-01 1.624
## studentLocUT 4.600e-02 9.688e-01 0.047
## studentLocVA -2.396e-01 4.937e-01 -0.485
## studentLocVT -3.640e-01 6.475e-01 -0.562
## studentLocWA 2.328e-01 7.710e-01 0.302
## studentLocWI 3.148e-01 5.844e-01 0.539
## studentLocWV -4.570e-01 4.931e-01 -0.927
## proxStudentTypeLong Commute -3.421e-02 7.857e-02 -0.435
## proxStudentTypeShort Commute 2.836e-01 3.901e-02 7.268
## affinityStatusNo Affinity 1.031e-01 2.605e-02 3.960
## expectedFamContrib -4.893e-04 5.771e-04 -0.848
## expectedFamContrib.NATRUE 5.555e-02 7.888e-02 0.704
## aidStudentnonWVUReceived other aid -1.024e-01 4.377e-02 -2.340
## aidStudentPromScholarIs Promise -2.178e-01 4.090e-02 -5.326
## highestACT 1.418e-02 1.137e-03 12.473
## highestACT.NATRUE 8.026e-01 7.157e-02 11.214
## totalSAT 1.614e-02 1.222e-03 13.211
## totalSAT.NATRUE 7.961e-01 7.509e-02 10.602
## totalAwardnonWVU -1.962e-06 2.200e-06 -0.892
## Pr(>|t|)
## (Intercept) < 2e-16 ***
## studentGenderM 0.206177
## studentEthnBlack 1.26e-13 ***
## studentEthnHispanic 0.039768 *
## studentEthnAsian 0.710125
## studentEthnNative 0.078508 .
## studentEthnUnknown 0.362170
## degreeFAssociate of Arts 0.239690
## degreeFBachelor Engr Tech 0.002368 **
## degreeFBachelor of Arts 0.000146 ***
## degreeFBachelor of Fine Arts 0.021136 *
## degreeFBachelor of Multidisc. Studies 0.025071 *
## degreeFBachelor of Music 6.43e-07 ***
## degreeFBachelor of Science 0.000179 ***
## degreeFBachelor of Science in Nursing 0.041516 *
## degreeFBachelor of Social Work 0.141097
## degreeFBS in Aerospace Engineering 6.33e-05 ***
## degreeFBS in Agriculture 0.064224 .
## degreeFBS in Biometric Systems 0.013465 *
## degreeFBS in Business Administration 0.000664 ***
## degreeFBS in Chemical Engineering 2.35e-05 ***
## degreeFBS in Civil Engineering 0.000334 ***
## degreeFBS in Computer Engineering 0.024309 *
## degreeFBS in Computer Science 3.79e-05 ***
## degreeFBS in Electrical Engineering 0.000154 ***
## degreeFBS in Forestry 0.233577
## degreeFBS in Industrial Engineering 8.53e-05 ***
## degreeFBS in Journalism 0.000239 ***
## degreeFBS in Landscape Architecture 0.012027 *
## degreeFBS in Mechanical Engineering 9.90e-06 ***
## degreeFBS in Mining Engineering 0.598587
## degreeFBS in Petroleum & Natl Gas Eng 0.001469 **
## degreeFBS in Physical Education 0.000119 ***
## degreeFBS in Recreation 0.588619
## degreeFDegree Not Declared 0.095910 .
## degreeFRegents Bachelor of Arts 0.617754
## studentLocAR 0.508875
## studentLocBC 0.031680 *
## studentLocCA 0.429966
## studentLocCO 0.137166
## studentLocCT 0.321599
## studentLocDC 0.695303
## studentLocDE 0.972871
## studentLocFL 0.977421
## studentLocFR 0.218910
## studentLocGA 0.587503
## studentLocIL 0.476037
## studentLocIN 0.039246 *
## studentLocKY 0.619919
## studentLocLA 0.124026
## studentLocMA 0.612365
## studentLocMD 0.613309
## studentLocME 0.863020
## studentLocMI 0.129722
## studentLocMN 0.119429
## studentLocMO 0.607717
## studentLocMS 0.655769
## studentLocMT 0.053750 .
## studentLocNC 0.549873
## studentLocNH 0.280443
## studentLocNJ 0.809446
## studentLocNV 0.396612
## studentLocNY 0.841699
## studentLocOH 0.683316
## studentLocOK 0.100668
## studentLocON 0.013344 *
## studentLocOR 0.659147
## studentLocPA 0.875155
## studentLocPR 0.176590
## studentLocRI 0.966826
## studentLocSC 0.486458
## studentLocSD 0.164525
## studentLocTN 0.723025
## studentLocTX 0.104373
## studentLocUT 0.962135
## studentLocVA 0.627505
## studentLocVT 0.574063
## studentLocWA 0.762663
## studentLocWI 0.590179
## studentLocWV 0.354102
## proxStudentTypeLong Commute 0.663263
## proxStudentTypeShort Commute 4.30e-13 ***
## affinityStatusNo Affinity 7.62e-05 ***
## expectedFamContrib 0.396488
## expectedFamContrib.NATRUE 0.481293
## aidStudentnonWVUReceived other aid 0.019344 *
## aidStudentPromScholarIs Promise 1.05e-07 ***
## highestACT < 2e-16 ***
## highestACT.NATRUE < 2e-16 ***
## totalSAT < 2e-16 ***
## totalSAT.NATRUE < 2e-16 ***
## totalAwardnonWVU 0.372655
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 0.8323 on 4304 degrees of freedom
## Multiple R-squared: 0.265, Adjusted R-squared: 0.2495
## F-statistic: 17.06 on 91 and 4304 DF, p-value: < 2.2e-16
anova(modWVUAid_3)
## Analysis of Variance Table
##
## Response: log(totalAwardWVU)
## Df Sum Sq Mean Sq F value Pr(>F)
## studentGender 1 21.55 21.549 31.1057 2.593e-08 ***
## studentEthn 5 55.42 11.085 16.0008 1.177e-15 ***
## degreeF 29 234.38 8.082 11.6667 < 2.2e-16 ***
## studentLoc 44 384.10 8.730 12.6011 < 2.2e-16 ***
## proxStudentType 2 70.79 35.393 51.0893 < 2.2e-16 ***
## affinityStatus 1 7.77 7.769 11.2140 0.0008188 ***
## expectedFamContrib 1 0.88 0.882 1.2726 0.2593360
## expectedFamContrib.NA 1 3.79 3.788 5.4677 0.0194162 *
## aidStudentnonWVU 1 13.16 13.158 18.9929 1.343e-05 ***
## aidStudentPromScholar 1 0.83 0.827 1.1939 0.2746112
## highestACT 1 26.34 26.339 38.0204 7.644e-10 ***
## highestACT.NA 1 129.19 129.192 186.4876 < 2.2e-16 ***
## totalSAT 1 47.31 47.313 68.2967 < 2.2e-16 ***
## totalSAT.NA 1 79.12 79.123 114.2140 < 2.2e-16 ***
## totalAwardnonWVU 1 0.55 0.551 0.7950 0.3726546
## Residuals 4304 2981.66 0.693
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
ncvTest(modWVUAid_3)
## Non-constant Variance Score Test
## Variance formula: ~ fitted.values
## Chisquare = 7.722425 Df = 1 p = 0.005453909
plot(modWVUAid_3)
## Warning: not plotting observations with leverage one:
## 2168, 2288, 4123, 4238, 4358, 4374
## Warning: not plotting observations with leverage one:
## 2168, 2288, 4123, 4238, 4358, 4374
## Warning in sqrt(crit * p * (1 - hh)/hh): NaNs produced
## Warning in sqrt(crit * p * (1 - hh)/hh): NaNs produced
mmp(modWVUAid_3, sd = TRUE)
residualPlot(modWVUAid_3)
summary(modWVUAid_3)
##
## Call:
## lm(formula = log(totalAwardWVU) ~ studentGender + studentEthn +
## degreeF + studentLoc + proxStudentType + affinityStatus +
## expectedFamContrib + expectedFamContrib.NA + aidStudentnonWVU +
## aidStudentPromScholar + highestACT + highestACT.NA + totalSAT +
## totalSAT.NA + totalAwardnonWVU, data = finDataTableWVU_AL12)
##
## Residuals:
## Min 1Q Median 3Q Max
## -4.8253 -0.4349 0.0438 0.4598 2.9691
##
## Coefficients:
## Estimate Std. Error t value
## (Intercept) 5.848e+00 5.285e-01 11.064
## studentGenderM 3.377e-02 2.671e-02 1.264
## studentEthnBlack 5.234e-01 7.040e-02 7.434
## studentEthnHispanic 3.127e-01 1.520e-01 2.057
## studentEthnAsian 4.465e-02 1.201e-01 0.372
## studentEthnNative 5.226e-01 2.970e-01 1.760
## studentEthnUnknown 2.545e-02 2.793e-02 0.911
## degreeFAssociate of Arts 2.050e-01 1.743e-01 1.176
## degreeFBachelor Engr Tech 1.553e+00 5.107e-01 3.042
## degreeFBachelor of Arts 6.537e-01 1.720e-01 3.802
## degreeFBachelor of Fine Arts 4.693e-01 2.035e-01 2.306
## degreeFBachelor of Multidisc. Studies 4.366e-01 1.948e-01 2.241
## degreeFBachelor of Music 1.000e+00 2.007e-01 4.985
## degreeFBachelor of Science 6.412e-01 1.710e-01 3.751
## degreeFBachelor of Science in Nursing 7.286e-01 3.573e-01 2.039
## degreeFBachelor of Social Work 3.920e-01 2.663e-01 1.472
## degreeFBS in Aerospace Engineering 9.210e-01 2.300e-01 4.004
## degreeFBS in Agriculture 4.291e-01 2.318e-01 1.851
## degreeFBS in Biometric Systems 1.014e+00 4.100e-01 2.472
## degreeFBS in Business Administration 5.981e-01 1.756e-01 3.406
## degreeFBS in Chemical Engineering 9.829e-01 2.322e-01 4.233
## degreeFBS in Civil Engineering 7.868e-01 2.192e-01 3.590
## degreeFBS in Computer Engineering 5.770e-01 2.561e-01 2.253
## degreeFBS in Computer Science 8.690e-01 2.107e-01 4.124
## degreeFBS in Electrical Engineering 8.836e-01 2.333e-01 3.787
## degreeFBS in Forestry 3.366e-01 2.825e-01 1.191
## degreeFBS in Industrial Engineering 1.038e+00 2.639e-01 3.933
## degreeFBS in Journalism 6.834e-01 1.859e-01 3.677
## degreeFBS in Landscape Architecture 6.679e-01 2.658e-01 2.512
## degreeFBS in Mechanical Engineering 9.529e-01 2.154e-01 4.425
## degreeFBS in Mining Engineering 1.889e-01 3.589e-01 0.526
## degreeFBS in Petroleum & Natl Gas Eng 7.418e-01 2.331e-01 3.183
## degreeFBS in Physical Education 1.120e+00 2.907e-01 3.852
## degreeFBS in Recreation -2.438e-01 4.507e-01 -0.541
## degreeFDegree Not Declared 3.425e-01 2.056e-01 1.665
## degreeFRegents Bachelor of Arts -4.241e-01 8.498e-01 -0.499
## studentLocAR -6.472e-01 9.796e-01 -0.661
## studentLocBC 2.087e+00 9.709e-01 2.149
## studentLocCA 4.130e-01 5.233e-01 0.789
## studentLocCO 9.177e-01 6.173e-01 1.487
## studentLocCT -5.150e-01 5.195e-01 -0.991
## studentLocDC -2.124e-01 5.422e-01 -0.392
## studentLocDE 1.802e-02 5.298e-01 0.034
## studentLocFL -1.443e-02 5.098e-01 -0.028
## studentLocFR 6.478e-01 5.268e-01 1.230
## studentLocGA 2.825e-01 5.207e-01 0.542
## studentLocIL 3.778e-01 5.301e-01 0.713
## studentLocIN 1.183e+00 5.738e-01 2.062
## studentLocKY -2.906e-01 5.859e-01 -0.496
## studentLocLA 1.489e+00 9.680e-01 1.538
## studentLocMA -2.676e-01 5.280e-01 -0.507
## studentLocMD -2.494e-01 4.935e-01 -0.505
## studentLocME -1.325e-01 7.677e-01 -0.173
## studentLocMI 8.461e-01 5.583e-01 1.515
## studentLocMN 1.075e+00 6.899e-01 1.557
## studentLocMO 4.968e-01 9.677e-01 0.513
## studentLocMS 4.316e-01 9.681e-01 0.446
## studentLocMT 1.873e+00 9.707e-01 1.929
## studentLocNC 3.136e-01 5.245e-01 0.598
## studentLocNH -6.674e-01 6.183e-01 -1.079
## studentLocNJ -1.194e-01 4.953e-01 -0.241
## studentLocNV 5.841e-01 6.890e-01 0.848
## studentLocNY -9.938e-02 4.975e-01 -0.200
## studentLocOH -2.020e-01 4.951e-01 -0.408
## studentLocOK 1.590e+00 9.683e-01 1.642
## studentLocON 1.599e+00 6.461e-01 2.475
## studentLocOR 3.386e-01 7.676e-01 0.441
## studentLocPA 7.746e-02 4.930e-01 0.157
## studentLocPR 1.310e+00 9.692e-01 1.352
## studentLocRI -3.191e-02 7.672e-01 -0.042
## studentLocSC 3.846e-01 5.525e-01 0.696
## studentLocSD -1.349e+00 9.704e-01 -1.390
## studentLocTN 1.903e-01 5.370e-01 0.354
## studentLocTX 8.358e-01 5.145e-01 1.624
## studentLocUT 4.600e-02 9.688e-01 0.047
## studentLocVA -2.396e-01 4.937e-01 -0.485
## studentLocVT -3.640e-01 6.475e-01 -0.562
## studentLocWA 2.328e-01 7.710e-01 0.302
## studentLocWI 3.148e-01 5.844e-01 0.539
## studentLocWV -4.570e-01 4.931e-01 -0.927
## proxStudentTypeLong Commute -3.421e-02 7.857e-02 -0.435
## proxStudentTypeShort Commute 2.836e-01 3.901e-02 7.268
## affinityStatusNo Affinity 1.031e-01 2.605e-02 3.960
## expectedFamContrib -4.893e-04 5.771e-04 -0.848
## expectedFamContrib.NATRUE 5.555e-02 7.888e-02 0.704
## aidStudentnonWVUReceived other aid -1.024e-01 4.377e-02 -2.340
## aidStudentPromScholarIs Promise -2.178e-01 4.090e-02 -5.326
## highestACT 1.418e-02 1.137e-03 12.473
## highestACT.NATRUE 8.026e-01 7.157e-02 11.214
## totalSAT 1.614e-02 1.222e-03 13.211
## totalSAT.NATRUE 7.961e-01 7.509e-02 10.602
## totalAwardnonWVU -1.962e-06 2.200e-06 -0.892
## Pr(>|t|)
## (Intercept) < 2e-16 ***
## studentGenderM 0.206177
## studentEthnBlack 1.26e-13 ***
## studentEthnHispanic 0.039768 *
## studentEthnAsian 0.710125
## studentEthnNative 0.078508 .
## studentEthnUnknown 0.362170
## degreeFAssociate of Arts 0.239690
## degreeFBachelor Engr Tech 0.002368 **
## degreeFBachelor of Arts 0.000146 ***
## degreeFBachelor of Fine Arts 0.021136 *
## degreeFBachelor of Multidisc. Studies 0.025071 *
## degreeFBachelor of Music 6.43e-07 ***
## degreeFBachelor of Science 0.000179 ***
## degreeFBachelor of Science in Nursing 0.041516 *
## degreeFBachelor of Social Work 0.141097
## degreeFBS in Aerospace Engineering 6.33e-05 ***
## degreeFBS in Agriculture 0.064224 .
## degreeFBS in Biometric Systems 0.013465 *
## degreeFBS in Business Administration 0.000664 ***
## degreeFBS in Chemical Engineering 2.35e-05 ***
## degreeFBS in Civil Engineering 0.000334 ***
## degreeFBS in Computer Engineering 0.024309 *
## degreeFBS in Computer Science 3.79e-05 ***
## degreeFBS in Electrical Engineering 0.000154 ***
## degreeFBS in Forestry 0.233577
## degreeFBS in Industrial Engineering 8.53e-05 ***
## degreeFBS in Journalism 0.000239 ***
## degreeFBS in Landscape Architecture 0.012027 *
## degreeFBS in Mechanical Engineering 9.90e-06 ***
## degreeFBS in Mining Engineering 0.598587
## degreeFBS in Petroleum & Natl Gas Eng 0.001469 **
## degreeFBS in Physical Education 0.000119 ***
## degreeFBS in Recreation 0.588619
## degreeFDegree Not Declared 0.095910 .
## degreeFRegents Bachelor of Arts 0.617754
## studentLocAR 0.508875
## studentLocBC 0.031680 *
## studentLocCA 0.429966
## studentLocCO 0.137166
## studentLocCT 0.321599
## studentLocDC 0.695303
## studentLocDE 0.972871
## studentLocFL 0.977421
## studentLocFR 0.218910
## studentLocGA 0.587503
## studentLocIL 0.476037
## studentLocIN 0.039246 *
## studentLocKY 0.619919
## studentLocLA 0.124026
## studentLocMA 0.612365
## studentLocMD 0.613309
## studentLocME 0.863020
## studentLocMI 0.129722
## studentLocMN 0.119429
## studentLocMO 0.607717
## studentLocMS 0.655769
## studentLocMT 0.053750 .
## studentLocNC 0.549873
## studentLocNH 0.280443
## studentLocNJ 0.809446
## studentLocNV 0.396612
## studentLocNY 0.841699
## studentLocOH 0.683316
## studentLocOK 0.100668
## studentLocON 0.013344 *
## studentLocOR 0.659147
## studentLocPA 0.875155
## studentLocPR 0.176590
## studentLocRI 0.966826
## studentLocSC 0.486458
## studentLocSD 0.164525
## studentLocTN 0.723025
## studentLocTX 0.104373
## studentLocUT 0.962135
## studentLocVA 0.627505
## studentLocVT 0.574063
## studentLocWA 0.762663
## studentLocWI 0.590179
## studentLocWV 0.354102
## proxStudentTypeLong Commute 0.663263
## proxStudentTypeShort Commute 4.30e-13 ***
## affinityStatusNo Affinity 7.62e-05 ***
## expectedFamContrib 0.396488
## expectedFamContrib.NATRUE 0.481293
## aidStudentnonWVUReceived other aid 0.019344 *
## aidStudentPromScholarIs Promise 1.05e-07 ***
## highestACT < 2e-16 ***
## highestACT.NATRUE < 2e-16 ***
## totalSAT < 2e-16 ***
## totalSAT.NATRUE < 2e-16 ***
## totalAwardnonWVU 0.372655
## ---
## Signif. codes: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
##
## Residual standard error: 0.8323 on 4304 degrees of freedom
## Multiple R-squared: 0.265, Adjusted R-squared: 0.2495
## F-statistic: 17.06 on 91 and 4304 DF, p-value: < 2.2e-16
#test model predictions
names(finDataTableWVU_AL12)
## [1] "rule49Grant" "instEmployAid"
## [3] "instGrantAcademic" "instGrantAthletic"
## [5] "instGrantOther" "studentGender"
## [7] "studentEthn" "degreeF"
## [9] "degreeType" "studentLoc"
## [11] "stateIndicator" "proxStudentType"
## [13] "highSchoolGPA" "prevColGPA"
## [15] "highestACT" "totalSAT"
## [17] "scoreGED" "scaledAcademAchiev"
## [19] "affinityStatus" "expectedFamContrib"
## [21] "totalAwardWVU" "totalAwardnonWVU"
## [23] "totalAwardPromScholar" "aidStudentWVU"
## [25] "aidStudentnonWVU" "aidStudentPromScholar"
## [27] "highSchoolGPA.NA" "prevColGPA.NA"
## [29] "highestACT.NA" "totalSAT.NA"
## [31] "scoreGED.NA" "expectedFamContrib.NA"
## [33] "studentEthn.NA" "scaledAcademAchiev.NA"
which(finDataTableWVU_AL12[,21] > 40000)
## [1] 813 2031 4053 4098 4124
fitResults <- predict(modWVUAid_3, newdata = finDataTableWVU_AL12[813,], type = "response")
exp(fitResults)
## 1355
## 2114.119
finDataTableWVU_AL12[813, 21]
## [1] 41170
finDataTableWVU_AL12$predictedAwardWVU <-exp(predict(modWVUAid_3))
```